diff --git a/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c842d604b310a3de3165e17ab9ca2859ac51f00 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12659a4910139fa2e804cb0468e1fd3a179d4c42742fc2286ec9a6614287079 +size 34145426 diff --git a/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..611c7f12d10affc4e87e69082cb6c0381bac380b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb2e6f915d8492c150f225350e681ca9765788d410ecd6c5eef30ecc3e796a7f +size 17106028 diff --git a/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6973bae966bdcaa0a45e77d593640d2677f75a4a --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/0.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f2de2dc3407da2057784cd60f278e0d7fa0922c3da51a5a2f02e76a0e1a595 +size 17167449 diff --git a/checkpoints/Qwen3.5-35B-A3B/0.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/0.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcddbe3a897f7ecdd9b362b4a2ac210b2e49baf2 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/0.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9774b0a705bb0324b72b1240816c832de2d0db5fc73f7c37babd9e049f2bca72 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d427778fcfb89829f5b5bbf53619a240b63a29 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5712a302b456a83737f1232981cef28add8233df4151b06bc4cfe53a03bad6ca +size 34145426 diff --git a/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..188d05b6b482656bae29b366dabf003da4914be0 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:457d13f684ff6c6c9500e88064ffab200d522851e8ab77c93cff9e6b5680d0ef +size 17106028 diff --git a/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5341494c13a77d49b5e13fe001d635db8a2702c7 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/1.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:401fe7cc0480d8f9dde844e8d758d9986ab071e991f1e41add0494abed9c8736 +size 17167449 diff --git a/checkpoints/Qwen3.5-35B-A3B/1.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/1.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..baf112fd308a3fd7c1605bf3cd19cd797cd95242 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/1.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23388e4c6212481f58de414409118fd1efc8c33716714a06495b810d438bf480 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce57cc67d465ac8ff294ed61715ecd9317c50400 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa5b3b9df13620ad8c9189867bb302bcbffa0df54472cc038eb2f4d5c967f73 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ff9fdc07d0f731ab5d99ef1b231f4d3b872ac01 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf399bd1d84997b7e9c3af72e8f243ff3016ed033772abd15ac768862531f4cc +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0fd3cab033cd3289bdaee0d207a3ebabe46c688 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/10.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df05be82c0a45483aaf14d466e73b765b0c2bf12b083a8b77ed5acd9a236dd7b +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/10.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/10.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..67a4411130fd059494180c7d824d16784ca8da92 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/10.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f64d5a0194d78ccbf2cdda8cc1c0a976062bce98a8607f209608c2b3a2ad8f +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/11.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/11.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c38565db53bdf5d4ff9c679eefe21b2eae50d7 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/11.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9557493580b19e0178a3a67f43353b12a79904f4ba09595327d63cb693bac800 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/11.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/11.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..75a8a0bb04f2a66f0dea15b08eef8779fbbfe2fc --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/11.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9345ee292e45d16720b469a8a487b6bd69659845c8a3fde98e8c0264fb5cb14 +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/11.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/11.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..feed166ffde9a575a0e1275abc6843d1b2154b18 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/11.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab08e90f3fe7406117a97ce7ee18b23892c2bc7a0aa276d2886764cbe3bdbb0 +size 17167328 diff --git a/checkpoints/Qwen3.5-35B-A3B/11.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/11.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c03b6d0db157e69a4f9d1d2b1acf335403253e0 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/11.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b3ba5850b2d471dd7d9712ad6cd5a7eecd23368329f3f2e3353f48289493743 +size 34145248 diff --git a/checkpoints/Qwen3.5-35B-A3B/11.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/11.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6f6b1fea5ed42c12d0b319cbb12a80af9ebf16a --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/11.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ff8a86f2f0b8effdf2f1f822067cecd4207ddbb0d579b5df98c8f186dde39b +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..becd97fa98bccb9bf33680b9d90f68fa5dcb996e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ad7bfc96c6899f58815e01a2d65fe92495ea37288b94fe5d58915b24cc7b90 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aaf99411ae517e689f7472be12b32f43de7b3ac --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82b62e0433748cd57eef0f1721a0c2311a2a7ab19357d26b2593a7db193e6b6c +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ced4dbf08dbf2635a258d694e61c82b1ea1ac2c9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/12.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e973f305b6024c8bb74f9465ef31ae7a5beaf2c36b486bfbfc98c1207cc3893a +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/12.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/12.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dbb73758acf00036ccf42f31292277c899e82fb --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/12.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5783a331c889dd8beb31eb64ff4278d24d60098352706b8f9abfaa87d339dc45 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..67f19df7650f6107e2dbeade15863ab6af1659b9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffd301764bfa503bc5e68251293f21d9f3b8b60c0be7c207d6db8f65159566d +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4e0f949e17cbc2bf3e028050b6cc9340a1391fa --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820940c1c3d7b2f4aee16d1f2c3a56f91284e8ed6b3e742753659eed47d5e101 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ffc2a4f17d32cc5dc569e1f2ee6424accb0d2b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/13.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c317e8ca5a7a01472e9a9b5e806f5ab0ca914c69d984004fd32fd84edd423746 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/13.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/13.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..7307f1f0d204bda5e1ff079dcf77376b6dada7bb --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/13.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22356a9e7f70ee25460b03167e776d4534d90560a45c3b36a21f05a202efdf2c +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f41dcf24441931fe6ed92535d96ff5b2ab41ac3 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfeb5c7c94aa60fcdc43ebc27b936266b0052c2d3de70fb934b57649547dc0d5 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..91760db6b346d95b4e29133700120aa28b562d0b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f26b85edb2f51a1e2123d2ac9e48993cff95f8738ed36d1ac8946197b4990c05 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5997191f3513b6ff13e978074a5534a6f585abd --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/14.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1b62f2ed9698bc70a9ed1b117849e370aa13185c2564221d7fd7adc2cbca20 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/14.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/14.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..7df3501fd309b2641ccedd2caf7cc232715c41a3 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/14.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c56b3a6c611fe38cd537106af94a73d94d0a72c45c977b1d342a00579e23e11 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/15.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/15.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..195277d4e53db368d486421af3b1e94e6d9553c9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/15.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b34ebf54f18364d8de6b30393e86c71253aaffda9d86c5127a0537324768d5 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/15.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/15.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb063a95adb9ea7a4131d2c7aebccffa9cd8af93 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/15.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ffb0419e193b941a0f7f14793cedc4fa795e24f8f69a39a27e42799339d32c +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/15.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/15.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..142411381900af30987b727350345d23a7f883a3 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/15.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80b2e44b0964f20a40736640b75d3f2e7aae0f417dde972cb80b78349bd3872 +size 17167328 diff --git a/checkpoints/Qwen3.5-35B-A3B/15.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/15.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..571d1aa55c4262bc75aca58a6bc81d5ff7b998b9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/15.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c283e9cfcd8149b9f0346a037ef0ddc4e0de152c1c918f8e956da29c0f2cbd +size 34145248 diff --git a/checkpoints/Qwen3.5-35B-A3B/15.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/15.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..54beeae66a5b00fe7c7cc73e888c371620a8af44 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/15.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9912cd281a7530cc4304a5e3e4655cd2cefec6e42015ce1e9a1f2f5abf5ba685 +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..865be25c26da87b8f8eb6af4133066dd0132fccb --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f579d4af503c34af0ccc41f113aec286b274db6f7f09fe154e8fd2866992484 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..5268900071a7869ba4d83c6b563631da47ee091a --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efac859cb3efe040396735a509aa9d9c88e35168f83bd763b16748e52b063185 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9006339267b6d4f787203ff923a424c265ea3017 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/16.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6afa85556d07d849f275d633177f00c6a7f76be14a6848f397ee0278765cf63 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/16.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/16.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..524caf6fa3452d6d3b8a2721370a9d7673d3d9da --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/16.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3711ecee30c6920f085971a6f9a0ee1d76e3745b05548b46d32b14b1570a1182 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff0c45a835641999eaec47ae826481e07ad7484c --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10f86dcce62bb6884bd64ae03fdd15b43eba0825f8037531081633f0e068baa +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7fe63a3a443901605444116098fc750a599fe2 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126ae4edd6ab46bacbd0698b33d6977b693af6538f068d707df2ca8250d8a17d +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e33fca91c2828abaf64142d706659cb50dcdca1 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/17.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b46e5dcdeb6e6eb5c4be6db2f6f37f8bbb0d1654449b41b16a76c14701b6a148 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/17.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/17.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a39359a08168fdcd0df1ba5e97956fa86d850b7 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/17.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b878ee8f7f745ef8298ed69a21c3708510a3d101afb5173452f1fb30582bfef +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..d870a98a634ddb438b827b04979d1f05aa74ae5b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd2a7abb9ad1bd5e1f2e12fb58861469cb7a4cf4727f191d187c7070d376497 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..594f3ca200624c2d357a2521062ee3566b640cbf --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb8210345da026167f3462b773e1fd80c50892f472433c58802f52c43da7803d +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab0a90ece8bcba5db194a19bbbea5dca080bd4e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/18.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4332ef552fe3146cbedbdf759320786780537f0c4f2854563241b6bd94f9ef1e +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/18.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/18.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ff743eadc9b633221e7505be685cb5a1dfe85d9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/18.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:649314e471113270aebb8a9f0af7f5827c0f22cdc3fc1acfd2fd9257e71a926d +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/19.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/19.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..b823b7ef19b8e4f4029911d6d9777a21313b79b9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/19.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2e2ce817de178ac0d754af28a2c2bf041ee76a052a8c5eb058ba816688e0ab +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/19.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/19.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..201952cae28101ae441ec7ec6ef0b2a7d1213c81 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/19.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f35b9bcb809f5f8a5f62bf81319e1e4b3025392f8522ce5cac70ad019661e69 +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/19.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/19.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..845d8a28f6bf25de0f8c1ae5fb58f55572db976a --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/19.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a83922052c71465cbdb2d670c2bcb9ddab064c9cf1fd7f37c84cb9787b88fd6c +size 17167328 diff --git a/checkpoints/Qwen3.5-35B-A3B/19.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/19.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..124f9f6d281483aea951027274160f2a0cdcae12 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/19.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1a59b6311a8df5d730f57c743864e643a8ecb761aab3de3973820b3cb4ec108 +size 34145248 diff --git a/checkpoints/Qwen3.5-35B-A3B/19.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/19.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dbf6fe73f70543a139298d70e5bf056fbadb5b7 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/19.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:797f3304af21140817d616c15fd56742e39ff76d93a73dccffaf53b8963016e2 +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd50bb2561983c19ecafa786445cb160f9e8c5f6 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b942d8cdb821d698cec287ccf2e6ae9840f99aa2f3ff09682af8e65e9f1970a +size 34145426 diff --git a/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..377f80d4f00808d781770ff343c19a8082a32e3c --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740a7062a375872dfa7527bb90e5bf95ee234a765b24bd0dd27c287a3a23be0a +size 17106028 diff --git a/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..37359e094babcf685e8ab741e1df7a57875fed94 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/2.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c074477ce51341c06f6c3c9d2ae62d06f81634e50f70a4fc5344ddf016c67daf +size 17167449 diff --git a/checkpoints/Qwen3.5-35B-A3B/2.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/2.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..75308b771d38b5d5e4feaed3545db4695872521f --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/2.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed5d90beedcd7385ba96fd4d1b45bca1a71da7b942979b85ef3c717533aa2d3 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd7c0854bfa663341b14cf45df086cf9d17911fb --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92b820f8ec63d0513cae35b299c7fcd3f0ff4302e4926720694495274620f5a +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e4c50c3b4aefb495fd292532df5fbc0e3c06e51 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51deed6b0c7b96b5ca8479157135315c81d961b44cafb299f0527b77a9b852df +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f6635adff0060fc31c4cd90875bc58207885845 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/20.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc523a434c943137b8536cfd3e03a9609579e32087556e3ac7586638296ee81 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/20.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/20.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..238336a5a7eb71ca7776793ecda2ecfc636da2ae --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/20.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a607bf99f86ac7955cb260462ef3e16cd4b484d3ddb652d88ab9782598f3c695 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ea62d63ce2a3ca7b6bfe35a5fbe792093c04ef --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45333cd6a123a52b10ac1e66858a0fcbcd14789b2068f9c98ad55a5ddda4c289 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..42d406eb3979f354d4abfbef3ef3e2bbc4032024 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ff2ae86b7314aa293981e0429987e08be4d0db9dcb8844c47cbae0d9c2e21c +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e17c8258705de4a71605e27bda652121d856a33 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/21.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ffc91f43681f4f8c376e3e6e23aa46d7fc9347d42fd4b2d9b6f60d2a5b320d6 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/21.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/21.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..30cc6e3bc75dc5a05beeba0d4839a3eee35fd2f0 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/21.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:145d2087fb63162c3f7776cb19391291c154e533ac80e4b90e49cf5cc4e3b721 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..298d49123c61e186a5a45bba560244f3a7d4739b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f8401936dd2027e71989a0948f9c2096147a1be72d9ead7dec2ea93cfae6c48 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..df8b4eee3617a0d374c7a6c8dcfdd449a1931be8 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f6c267a49692c27c58fe6e288fee1545478cede15ac0f3fba314cd05f6d744 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..14cd4f4da46386f39581621901a98448a2029ba8 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/22.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93aaaffe562edbd662ae88eb2ff721c8b4199c6ca51ddf3ce7b4483d67049b5 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/22.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/22.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..d860a012d503075cfe98f63af5495b09fcbdaeb1 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/22.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b1065f2e88df63a9ab3ae2ad46b6dfea1aab45b5185af10936d80227a99a1e +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/23.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/23.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a6162b1c41f6a4d35da9cffde694c18a1059353 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/23.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c91039d44337ed5ff671311653204858d8ab8dd115ac470e4426df74633df7cf +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/23.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/23.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac2285a79278d0f56eaf6558a751f402b43ebd81 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/23.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:505ca3348cab3615514a279e5f83c995dc94e26322ea661beeccdda808ee7875 +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/23.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/23.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca9cf6a6b3a6a41ad2b9ef2c03ffcca7dca31634 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/23.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba0afb53af31cb64087baef1c64331f111bd9c579fb048cb690f1020ccb0b02 +size 17167328 diff --git a/checkpoints/Qwen3.5-35B-A3B/23.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/23.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f3b52136f5b1f81ef44309e905bbb53139a4fe --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/23.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28d888cfccf5c49478edd9fd6223271d37c67d4a7228e8a11c0a2e475868c07c +size 34145248 diff --git a/checkpoints/Qwen3.5-35B-A3B/23.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/23.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dee03e1ab530a6a6b3e19b53699decf37e2e46ae --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/23.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8840938fe4b955ffcc633d39e13060254212f34892eb27692a33a3cd2c97b8a +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfa53908978b04462c266bc6dad39c18d232a3ac --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1fdc6fb7828d84d2fa29cbaeacbb0cf879e2ee64cf7dc3a582d888d0e2dfd5a +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e6a727d6aa09c5b520808bf4c3f3c3a4b6f8a8a --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8ea45af41949b4da50bf2f5b26b6d4e981fe0ecd7121cd0d2680c0b65c7e1d2 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..21d626c758d25c800e53f66cdb4cb33f924c8f0b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/24.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a43e090a9d03529aa50514440ab5338831c480ed63eb5386e56640afe78487e3 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/24.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/24.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..96176bda5f0cc4bd7c9e761d9777f448dc68cf30 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/24.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd8b403f731ddd9cfea80deeb02ec9c52be50734e0d27e6a74f1d7f9e6ce2221 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc392d201c0b3b6a151bade27b4aab920c049e5d --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90fcab01979a923fed71a475dc1b22cc5c0819f22885509ed4d6f2a625c87412 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ba060975887b63f2511dfb127498c9a2069696 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec29fe8dd7cf872d6dcbe182614c947f32fd75b852cd5a131610af68040e2d9d +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cd7b795749aaee8fbfba0d1741815bfd25b34c3 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/25.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175a9f13ab64719190a519bbe96eb55dea7c5a914bbea437da13a8f1ef80a179 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/25.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/25.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..009617d1d4528c0e19d58ac05a3b059e129f62ec --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/25.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0c1d68520783fb7f2f7334e99b273b65ac978184675ca0c9f0540d56228f751 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..42e9296afd2e21488874df6cb6449a5ed6ed86b8 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa06e0ce5dd79c251601a5ea7477640ee868349636c8ca9b42f1f6a66ecf363 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4fd480cd27b2eb2c2db67ff4db7f93953ebb9e0 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1248ff8861cea206407051a92c42fe8bc2d811f17f2243a33ce664a8ec22fbf4 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab492b4e5b2c2c2126a2e8b76e722ee27ef384f --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/26.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ae91a87dedc56efd10c227a4c4e36e95c3a558219a22a33b0ac2eee3dac504d +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/26.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/26.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..30912b6460090357057443870dfb12064b182014 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/26.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7857d3897a075c3ede40072f6648e039d1ce228bb847bd282b93a8c3ac9360f8 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/27.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/27.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3fdf1ce31db12192f3b4b447ff6658e6bce2d61 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/27.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf826dce4c742062c035730c27beef141de6fccc9a8cf0c80378f1bcdafbe1a +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/27.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/27.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c4d69c55d2b6a7737628dbac808801272bb02df --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/27.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5627f8ab0d5f294ebb81979527e55aadac1625af9e6b8786054f488c140d1443 +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/27.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/27.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4feb58e7d00fb490c1b8d382089909daffd2bd9b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/27.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a39b7cbc96fba4a8fd3f0e021b910d946623840b6d459aef72569aaeee588a02 +size 17167328 diff --git a/checkpoints/Qwen3.5-35B-A3B/27.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/27.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..439c728be2b9008254a1a0cb01a5048b87fbe4d1 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/27.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52eacab4855e0869199c62e8f3abb14064636ce51b8ddcbad4df92a5a2022062 +size 34145248 diff --git a/checkpoints/Qwen3.5-35B-A3B/27.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/27.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b9286170de1251bb1e9e7b0144e16a5cdc11212 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/27.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d368ad42e281cab966c3ca40eee6b933daceb46e45462bb725bf2d6aeff69cef +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a69f2eec2d3402f230de045c497b4263280be18 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd9e82b6e4fa81d262f4180a198ab88eaf2d797f534e6057a7fc39fd579fd4f1 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..6742d772f427efa27f2c66285a86fa9d34ded8f8 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72c8ab1952b87b7a75d71f94d78d8ca32c6d393cbbc1b0f8c4924adcb829517 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7a092b751a2c8400f7b2e08dbd5300aa1562e3e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/28.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7652a646e9d5271f8aba62bd3a011d8f18e0121e9d8d9e86e51069e598e2e90 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/28.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/28.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..3299fd12d8ba00273dcf54888258cb5ad9969081 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/28.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81fe23264c2a187c154f70bb963acefc52f02c36bb5a539a66deab7ce12438b +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..e10db07f91b837d10b26bbb9e2385c2b0a41e5a1 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6fe1cc6304aacaed20c35277a757c933e5dd9bdd6d113bef655522c56311c11 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..43df50ce0136b01bb2e82ab64e1354b59edc2b7d --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a9b1d5ac534611c5e7470bbf53faf8a6b117bd4d4596077ee3656cd958cb564 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0ad9f05a8108cafa7b65bea4f1c42319765b3f4 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/29.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:819d65bddf6680367188bbfd4507d97821a097a3a97533e9764f34b36f707527 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/29.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/29.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..220b71b3f0ec28dc6ff29b89ce8f4615753302bc --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/29.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e866af54d7d57c0ba9ab50cf8cafc29bc175400f6d3456bd140bd253b387b408 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/3.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/3.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa94e4de12db07c7707040df7a7a13568f2dc2a9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/3.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b07a3ccfa01ee8c11efcdd4b9996bd45c17c10330821af1ac35223fcc24cafc1 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/3.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/3.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..73d5f8634ea42355a8c57c45a3f13c485eb67774 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/3.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a092e687f3c6b68b76aa86c94e2347eeeeda67a39f5706e0a24544a11b1cdf1f +size 2196429 diff --git a/checkpoints/Qwen3.5-35B-A3B/3.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/3.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..975e19a1b6cb18b52a166f24b68a63bf2f4eea4c --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/3.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e9b30792b23db017933aabed2776e17b6a918af34f34ddb02d173b3450030f +size 17167309 diff --git a/checkpoints/Qwen3.5-35B-A3B/3.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/3.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e4ac64bc486bf9734bb7269fb9827a5c8c12e91 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/3.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee55ba6a3d45da2848ef8ba4780ce6b5633c9265194795fffac7bde50964ff88 +size 34145229 diff --git a/checkpoints/Qwen3.5-35B-A3B/3.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/3.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a018209f1f839fbaed4a7600189bec3264ccf837 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/3.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee34fe4e7bb7942f6aa1dd4aac175ab75ccaf9699687e3059a28edfd3ce3b105 +size 2196429 diff --git a/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..d65a7e3762e631957f41135c16b91b8d567e44f1 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6ccd97f61092d08b4e9970a2d3983dd91cc9870c6ec10887a5bbe697b5a03c6 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..03980bd5a2fc64c27c5af6bd9aac4538f8feff9e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb32b3bd71de6a8a3c7e472bc166b2ec45b91a1361c0d5c057f999e3ba6e24e2 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e378c268e59369833753b3f6190793ab9827f836 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/30.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0888c4910709ebede07b3c3e35676206509286b6ce46999cb78118464ec51d27 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/30.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/30.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..24677da92565d9dce238c6fd992cdf686044a00d --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/30.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99885b7d778250f3a4acafd9804f1074d6ff27e32d805e9c1644cc6571d9584b +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/31.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/31.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d5442539ec3f066ee4adcaa8bc29a740e89c42a --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/31.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ccc79ccebe0a43440279e13e7b11b14f00728da0111e45aba754a2222b383c +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/31.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/31.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6abe1abf91153d21db0312f2a9d0701a9efb783 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/31.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f1bed2c9224414532d107c08f054f008ca9bb31087fb7b8a81929d28879f02d +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/31.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/31.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad293c69a8ba4822c3ccee894b4ebcbe479df79d --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/31.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5416851fd22632df8e1a6d6239f80815858d301c0932c6a9a5dc00ffead92c +size 17167328 diff --git a/checkpoints/Qwen3.5-35B-A3B/31.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/31.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c25967fe4bb0d02d24453691f30b710ef2b6662 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/31.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fa219545b878405bcfc24dffe3a7d47dda55fab14abe642922caec0671f6967 +size 34145248 diff --git a/checkpoints/Qwen3.5-35B-A3B/31.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/31.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..88d21f042e2fb59d9879c363bc8667a5cf5c7d1b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/31.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dac3be2ad5e15c41121f894142f64d9add0b9e6ed5fb298f105736344010ecc +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff5f7a0096a7e021b6872fcdd6b6607c651ec906 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8b3637ae4c3e907b39edf98dc9d3abea244df126502982575cdaea54772034 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..12fcd65e92ecc36bc3e9c8a5299a604a27267e61 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4030b81db5328e84a20673178f8334ec3cf0006f06a44622262500a246c86ad7 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e4061ad36f81895335898868ca396c563472d81 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/32.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823563c92982b871e44f4f2624eb58224ce2b50921d39cbd4d430e92b91b1367 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/32.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/32.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a07ea1c9de4aae27480e6383b610b3fc5b02897 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/32.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8bfc570b342739c65405d1ed6527fda61d8b1ca7e3f447e0da79d773ee48e38 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a5b8f29d957508b49feed45b016666ef0ffda2b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd76a4b468abf3eae49b92598db81b3dbb00679f47036e47de0e813dbd53292f +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..db4c5238cd1fdb5745eb99d852db6b04e57a5eca --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9e9b442a06cbfedb548226e9584cc0ef9c68b1980d5429bde5622346af8320 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1855e4030ebb713ab358aa27354b2ff69ee1862 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/33.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc057b59c7673c73c1c958cfe9c85a8c1043fa3db65c77cbc9b780015331b8a +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/33.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/33.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..af9884f5147092dd1ba9679ae5d112fbc1432540 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/33.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f934be9d80ce94a8ab5ad085b75a0c2a0cf65abe35b18b1253541b7cba945e1b +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..64b27d493d168953325cc53f5eaab156b4f7b43e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d79734a1d3d47c6f2605957fcfe7efac119fd3260aa741cc6902da4656c7878e +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba5911f9c6dae4002adc91975423c65b9034988c --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0daf1505ab65fa0420ca0aa666acf76127b07a120c60718cc467261b7d031706 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d90c1eb8e4ae90fe6d17f7473026a3422c7ba6b6 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/34.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecb6c5f56f4a5722ba2bab98ca49c35e227fa285e2be45fdf916af2c592a5bf1 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/34.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/34.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e4cf1c1bfd8e24a3ee83297af2cb5e153898292 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/34.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:816c54fe2997804f6e73f60e21a026fced8192cdb4394d3e81b719231d2d5033 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/35.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/35.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..62dce538074adb6edbeeb7e879187d97ec6756b8 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/35.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b8a7d0423a9ae0aed12ba5b1c535cf44153b6f2cb40941ff56abea3f4785b0 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/35.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/35.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..daec10a6edb47e2ccf1a55e9a3e99650ff6525f4 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/35.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f6104172ee87e6ec600b39a2b9d9833e5c500061a0fd933c895779027818aac +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/35.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/35.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbf7864423a9f654672d9afca133d4ff0e242a83 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/35.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f978cec7871e340f3fb95f331323a697fdcb7ccf17673ff13eee3d3333c15a9 +size 17167328 diff --git a/checkpoints/Qwen3.5-35B-A3B/35.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/35.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb67c199d961447f58428b4e3991e92e1204b32d --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/35.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12410f60b6eb2d088e7b75edcc02fe6efc9c1e1f2341f0f98003ebe6fa9ac01e +size 34145248 diff --git a/checkpoints/Qwen3.5-35B-A3B/35.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/35.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fa39b68063dd8f54461ccecdb1e404ef62c8ce5 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/35.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51a57dcf6be0da3da27fa8a6b8099b11389d1010917ece3bb7ca3a267f18d5d6 +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..16414f042ff9b7718121f333fc910ed95f7eb04b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e886b720ff47c40cddf4e5fd3dfb3c3b495390c70b2cfbd4f1a41c9742dc64 +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..e989aa53fe8deb13602f819a143c941b210d711e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9067caf8bcd10dee32495333a2ebb9eee246070093518db2c3434f34bd1ae668 +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4bc257a74509e601b8b9891174d5b419be0c846 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/36.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f260b75fff08ed50a7c87bb72fcfdb99ae542ddd0b76e8d7cc28879e1733be72 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/36.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/36.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..b929f9e06d204a58b8d68bae8fdd4a18384b7083 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/36.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de6308fa76388e840a9767697673d66b18a39e18ee219540f43fdbc15fcf2aa8 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dfe6c3372525ee06f05549718a68d2fd3da5bd9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf738ab65efb57dc0a07cbb5ff90d6cdc0f88da8af83876364e806b4c5df595a +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..8795dcbc03a463de554946fa5e6da27bbd2b99a7 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96189070723f7868865716ced0ff0a971857536c1aa00baf8f0131197159eb7c +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3399a68cf5a542bc464521c9136c80d79d481c2b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/37.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f7b292171f7c639706bbc2765303f0dabf0caaf62c91696fb62b2804811cc84 +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/37.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/37.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..f42be1004b3b863ef3e84703cd47b332f52d04ad --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/37.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e8605ff924c4283a8c9dbea75ff6eca6a008a3ec548542b8a15a9eb3afca18d +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4febd20d473f55a867c6ca2253fef1e8542c23b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:731a1376f58dbff456d7f036029f8965032bf68fa952b95aa907b69ba63c0eef +size 34145445 diff --git a/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..cde5b5a219fb859c46ed60d35dd62023486a744b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:770a1d3b87921fc4b6b1e0ed76184df43e34c80f4fffa90986ec2e06ffbaab9e +size 17106047 diff --git a/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd264058cc3d6778c1a3c7a0bed972f43f4bd38b --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/38.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e2cd3ff2df0f561d43286f72407d4d2ea3c177dbc77e87e7cb8fbc92065c5aa +size 17167468 diff --git a/checkpoints/Qwen3.5-35B-A3B/38.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/38.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..d76b70460151f7a65a4563e88d2e84160aec7903 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/38.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32102760579c28d8a89df1858af6002c23999602d8ea3854178bd43f63068987 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/39.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/39.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..2573fa436993c4dd2fd611f990dabc60bb5fa8e1 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/39.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d038c26417d891b4097af7cb9780bd1d7e588dc2d7cf4198ce04598595e23256 +size 1635863273 diff --git a/checkpoints/Qwen3.5-35B-A3B/39.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/39.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7af9fbffb214bfc2dc672b01940e48086048b6f6 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/39.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52c34b3fb2fa1c2726191f455a7de7e6e7eb7f0577da07921632a16485cc9ac +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/39.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/39.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1f4c1a9e7ead54de88d7afd4678218ac89dd063 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/39.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bda5194431cacdcfe178d1d4e0d9b0cb90a6497b433ff0dca20b163fac24fa4 +size 17167328 diff --git a/checkpoints/Qwen3.5-35B-A3B/39.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/39.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f770b28283a70c1cfd75cda6ad6eb98fd58fae4 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/39.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:662ba925ead7c40b26d559997389c66309999973bf0017b8285595fbc90e8c5a +size 34145248 diff --git a/checkpoints/Qwen3.5-35B-A3B/39.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/39.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c300f5a0f200aed94843f0f519ce12a36aad97c --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/39.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5daec44b50ffead19580578c56530959a46f56c6e0745212c0039082fe6d9f5d +size 2196448 diff --git a/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..83bbf5df5dc98aa71dec14b90f15cd8e74331ad8 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edae6429ca5474a983aa6df6212877db948271ab3c35d89081740827ef506566 +size 34145426 diff --git a/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..acbb8cb242db004427ffcbcd445bae623ab67300 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc5a4d6ca71fa8ab0934dcb4aeb9d3ea27da18b7f91d5e646eddb89c88230cc7 +size 17106028 diff --git a/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1341baa2154a3686092454316e077e2c05b32ec5 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/4.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b326dbb4f7ebaf5947e92d4c20caf6b1d6c4c5510444eabe046cb86eecee63a4 +size 17167449 diff --git a/checkpoints/Qwen3.5-35B-A3B/4.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/4.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..b928a1b1817cfe6d0b6a3217cf3ddfd665cd4bef --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/4.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:655221d26cc4049f9af60b1c3d707d26051cfdffc4794c1b050e86301343d4d0 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..300460f2ecafacbb2b1d0d80757970afab9d7deb --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64a9cd84844ffdaa2f0716f487df1d6ce11ac639a61430e1ab648c7f9bc6974 +size 34145426 diff --git a/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dcdcda06ea20ed772d6a4b2d8c13bbb27a0fc3e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01873c6a5b42a5bb0649a252e9a19d334d4fb2088d8b3e1e3104a41df8984dd2 +size 17106028 diff --git a/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d4033fc5bede40e7f8026f4a6019d8625959751 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/5.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d90b6df42d541a75ee0ee31db97f79844e2eb40eeab71163af3f55a979806b4a +size 17167449 diff --git a/checkpoints/Qwen3.5-35B-A3B/5.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/5.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..299e59040d356db518e2153a406a552a8175617e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/5.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27ba8558da5bc303795d12423d746153b057009534360229d2913141d64aa95 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..70309a8e9f7d307d42057c8bd6a5a65ff997791e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:595e1c0546139f8de582de77b82ebfa5664d0bd27a507f3f3bc2c6abd6c82c9e +size 34145426 diff --git a/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..e95ffc627944470d97364660bfc890080dd3d5d0 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c30c8747b9affcbea633c5bc413d1c41d5f743777f9965b1c87f1fc03068c2a +size 17106028 diff --git a/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b461d160405960aa11aa1cfc4a2ba192e6c1d9f9 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/6.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:471c575dba377724facf611fc01b9a018aec10120485dbc495accf72b085ad3b +size 17167449 diff --git a/checkpoints/Qwen3.5-35B-A3B/6.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/6.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..1799a74adc8bb59ff1a2310d2f2e7b0a02a7d199 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/6.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc2fe51259a94795b80403bdd829ecf3717a3cce0eb988cf9c4655385d971070 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/7.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/7.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..364e6d7f919303de8f21ce481786721b564aefc1 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/7.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28e6f3c56fd50897ef0ce07e73448d119455d3753cccd3eb91dd06ccb0901ae7 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/7.self_attn.k_proj.pt b/checkpoints/Qwen3.5-35B-A3B/7.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..569033af857fae93839470aeb2a4ab2c8813284c --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/7.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf2ca630285f6fbf8547643890150a4bbb6146458481d37b532b381f89aed5d +size 2196429 diff --git a/checkpoints/Qwen3.5-35B-A3B/7.self_attn.o_proj.pt b/checkpoints/Qwen3.5-35B-A3B/7.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f883fd2313f2790577e5bcb209236e298bcb15e --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/7.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6ace39e1ddd14969fb17e02767c1ba0d5f3a9036d93fb1a1a6a4ea792fbd1eb +size 17167309 diff --git a/checkpoints/Qwen3.5-35B-A3B/7.self_attn.q_proj.pt b/checkpoints/Qwen3.5-35B-A3B/7.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..debda6360427590ce604f1cb01c5ed074ff75124 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/7.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99b03ba21d1e7c6cfa4b6f9a2313193cb1cdce31c0c59629faf3857fa06c3038 +size 34145229 diff --git a/checkpoints/Qwen3.5-35B-A3B/7.self_attn.v_proj.pt b/checkpoints/Qwen3.5-35B-A3B/7.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..87574d40b9b17f3cf0cefea93a7d9129418d089a --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/7.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92045ac9c7f1c1be8a6f22308b246cd6f491b4e5a21a50aa374f85a658404222 +size 2196429 diff --git a/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c50b0699b7381a8d907498f5c60fc08face1107 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ac859f2c1608483cf26c6757451922b3e09466b05dcc9b5eb4f750ca8ad85a +size 34145426 diff --git a/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..52ecceb4187ecbaa1d479bd1ec3f21f548b5c91d --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:592bddb5144ec58e2c4f542739ac88b3dad4ecea433cda1bcc24e96e45de617a +size 17106028 diff --git a/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8593ada6b77032034bb434895981bbc28cb98582 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/8.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87eee0354578aa0ed27bb54e54c691abd510551d649c077cfe32a759b3f9bee2 +size 17167449 diff --git a/checkpoints/Qwen3.5-35B-A3B/8.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/8.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..f500e8a529a5a55919d98304632e0385ff948def --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/8.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:772a98458f6485a61d677e15186bd6a7a5911b7a9af8a3c6df30dbabed16f236 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.in_proj_qkv.pt b/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.in_proj_qkv.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb53b787b8fec6f37b1737f1a373a554c66c0736 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.in_proj_qkv.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db91f6f52921236605be94bb3d4a3344aead6e76887eeb78ab14997726f07e5 +size 34145426 diff --git a/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.in_proj_z.pt b/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.in_proj_z.pt new file mode 100644 index 0000000000000000000000000000000000000000..39f2f3446c087ec32e545781b193d298eec0448d --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.in_proj_z.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03bddff4a85f28d674189c9985fa5fce357e18361c3ad451506aecf71e609c46 +size 17106028 diff --git a/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.out_proj.pt b/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.out_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f3dc189106ce7edd8bfefacedab31b907065451 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/9.linear_attn.out_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc057b3d91263af3debe43c7b9c2e5520eab4ecac3bf7cd619969bcaec7cf2e +size 17167449 diff --git a/checkpoints/Qwen3.5-35B-A3B/9.mlp.experts.pt b/checkpoints/Qwen3.5-35B-A3B/9.mlp.experts.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9f05e0aa924f8079c79bf240a16362a2cccb3ea --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/9.mlp.experts.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b61599f3fedf1dcd5c791123936cab18e2416a718a2533db27f0cd54b0564ba7 +size 1635863244 diff --git a/checkpoints/Qwen3.5-35B-A3B/args.json b/checkpoints/Qwen3.5-35B-A3B/args.json new file mode 100644 index 0000000000000000000000000000000000000000..fececd7c4d489df94d174ebe302d9304e43428a8 --- /dev/null +++ b/checkpoints/Qwen3.5-35B-A3B/args.json @@ -0,0 +1,48 @@ +{ + "model": "Qwen/Qwen3.5-35B-A3B", + "params": [ + "channel_scales:0.05,angles:0.05", + "weight:1e-5,quantizer:1e-6" + ], + "epochs": [ + 3, + 3 + ], + "weight_decay": 0.01, + "betas": [ + 0.9, + 0.95 + ], + "eps": 1e-10, + "loss": "smooth_l1", + "group_size": 128, + "n_bit": 4, + "num_rotations": 8, + "skipped_modules": [ + "mlp.gate", + "mlp.shared_expert_gate", + "mlp.shared_expert.up_proj", + "mlp.shared_expert.gate_proj", + "mlp.shared_expert.down_proj", + "linear_attn.in_proj_a", + "linear_attn.in_proj_b" + ], + "datasets": [ + "wikitext2", + "c4", + "redpajama" + ], + "val_dataset": "pileval", + "train_size": 2048, + "validation_size": 64, + "batch_size": 16, + "val_batch_size": null, + "gradient_accumulation_steps": 1, + "seqlen": 2048, + "cache_shards": 1, + "output_dir": "./output", + "resume": true, + "checkpointing": false, + "seed": 0, + "use_wandb": true +} \ No newline at end of file