diff --git a/checkpoints/Qwen3-1.7B/0.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/0.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..90ce4e2e99183df9a69693b3b98ecb4678042924 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/0.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffc5d6defd5930405d8d48e88f72594bbef7cc237d4a5074f1d3e25412a8d06a +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/0.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/0.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..033908bb6c11202fe2c94e031f1fa393f1203fca --- /dev/null +++ b/checkpoints/Qwen3-1.7B/0.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb452e2e85b52fb99e276e531cbdf8fa8187808f910429d01c5c55c879793237 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/0.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/0.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bf545c0ff1199317de31ed1c73f5d57f4ad4b44 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/0.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef27cc0e3b984396b7390c076e7f259be08f32a3f6d49c6d0fb087c296aa664a +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/0.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/0.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..018826c8e52b3752ed7199ea33f2aefee8b48c78 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/0.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d17620c5cf668960ca66963c4fa98292b1489972835daf83a7be95c74f0ff76 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/0.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/0.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4271d33ad16b09290165f4b90a29c0c74028ffbc --- /dev/null +++ b/checkpoints/Qwen3-1.7B/0.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e707a4f17780a149c09b07cd7659113a1ff138a6e70fde7921de8ba446faf9d3 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/0.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/0.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4ea5c33b797a961204543563703635e235c524 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/0.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f750c350f44ac3da0ed754ba12fee795491f270ed18c48c847a6b7bd23fa75f +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/0.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/0.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8c2f523dddb78d39cb658c833ccc7858f754673 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/0.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e6815c70b3bc171d5d919d428dd627cc3ff619423f3061b32bcf84c2c320be5 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/1.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/1.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e7fca6159b129338409f46d527ef2690b5024fd --- /dev/null +++ b/checkpoints/Qwen3-1.7B/1.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3416cd9251b6beb26606d127fd65cd79168972cd98d016418f38f38dfda576e1 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/1.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/1.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f27d556849dac12d12ed0763aaebfe1ded497b0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/1.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ecf068df6555b637e58042023e400c637ed7cdc1ace6d4888cd20e9c0c4cb2d +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/1.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/1.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c87708403926e38d77ec465cb536cbc811e97c48 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/1.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79f4d22176ced249b36ab3603e8f6f117c88bec8c2e907eefa65d600b44a3c52 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/1.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/1.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c73238bfc631b3cd3ccb2327da76b9ad6d5b07a --- /dev/null +++ b/checkpoints/Qwen3-1.7B/1.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce01161a1366bbfcdd2cbc6d8f6d9ac18060887026235619319027935599d9c2 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/1.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/1.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..afcc1f3ef8cd2b80a42532d643587b75905403f6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/1.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f291c4f60f47e411be31b2fadce1291632cf58aadcc692a003c49577d6c2084a +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/1.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/1.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d2d49b509a57bdcf4444023227f3cabc1daed43 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/1.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8749b5520121d45c37a57e894f0bdec0b859d853daf66cfca33d52368c7a1fb +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/1.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/1.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f554abe1f85250e0b164825a5898d8592e34aef6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/1.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e68f261da8194a1487a0b49046bbcd8347ebfa0d26011f56ee7620aca14660 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/10.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/10.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..423d13030ac5863c55d48b90f55d0f854c2d9048 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/10.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46b6db844747cc117441a22582784b7a777f2649870a608eeb4c953e708fa9c +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/10.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/10.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4980d512ab9250dc6dfea5b4c93aaf4d1bcd6a36 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/10.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7f8077ba200bed3edb1b3efb757279e05b1cc82b52911ae596fc02de3835c3 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/10.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/10.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c14ab854e10bbc62cb5c6ef5187548fc6c508241 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/10.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bdcd289ac879100973b9e4e9edf3657c0697acb9adfdd4c354ecd33abe89970 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/10.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/10.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e0949914bfed98b299c009adc725d1d6cad38cf --- /dev/null +++ b/checkpoints/Qwen3-1.7B/10.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a96de98aceac9a973881625f15d0df8eeee4c8a4ce2fb91648a4b53540f0228d +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/10.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/10.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7e0e203773642a0c12a867e7d3c946dc18c7e72 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/10.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abf420c7886299e22db1f8f0ebe0cd00844ce82663218c08b492635895302937 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/10.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/10.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d35a86f8be43d8c29003bfb8aef372e1c3bf749 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/10.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4bb4f16aa549bc27bc10e8a10b2b4d6b9a1f0bbc90f511727d8cd84f86492dc +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/10.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/10.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..56073cbe82c108c615a971613274e53cb43349b4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/10.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6953460d6bb3787c833222229ffd958e71e217605c0d736864a1db57f27eee23 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/11.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/11.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a07396ec24fd4029e39b1490b2cf58f3c7d9376 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/11.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3e841f0ced35ba18bf42b5db3e56414071b229152373880396fb4d57f6d58b +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/11.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/11.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b538d284451b39b7c4fd2a93d79a600ef6c8628 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/11.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d7414a0151351da76fcd664870248529ecf7cc95d42cc8544a8bfc13c9b037 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/11.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/11.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..36958fcb37ebdaaa64329480b0ed384a7f7eb3ab --- /dev/null +++ b/checkpoints/Qwen3-1.7B/11.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce0d0439f730795cae43d3692a26940ff6cc3b5a80a308183549574e1371617 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/11.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/11.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..28d6f15d6e13f88e01fc699e845eb4b8652051ca --- /dev/null +++ b/checkpoints/Qwen3-1.7B/11.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb99ee04d58571eb9137918bcdd23138b60fffcfbc835d11413a71e1393163d0 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/11.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/11.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..198410c562225b062bda9fd79779468e8dad5689 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/11.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3de02b45b9c3a6b275be3ba9364baada4546cdcf71cc2e940bdd7d0e1a2f40e6 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/11.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/11.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..315b3a7102c5f92983c1d7723ee6ce340d4f1638 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/11.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcda8c078755cafb8aae6e6bb82baa87f880672c6947c78a33daaa1a75acf845 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/11.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/11.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e81f25316bf790b67ac026aadf64a7c9b42aa3ce --- /dev/null +++ b/checkpoints/Qwen3-1.7B/11.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21108b9550a45d0372c5ffba00900c736612cd58befab5dc048283ecae8a2b53 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/12.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/12.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..556760dc1a6d62dd864e83a9a256c790eabf1ac2 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/12.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d65e51fa13fd926ef9d8d1adf3a28fcc8edc91fb885f5a619e9f4e58250413e0 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/12.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/12.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..43844330a4bcb4631b29bad0c745723d7bbb4aa5 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/12.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232ec215eb7d15de9514bc3d8cc39b7de134973c6b09d3d8797a721627846480 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/12.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/12.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..37f18e70a1511978a63c5f8ed11d8e19d08fd400 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/12.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:346e29f06f7875f6ab27eb15b9d28c84fb7286cb4889b3eadd872eadc38fd046 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/12.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/12.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2a50f91bbea4798dff8692b118e92b3245b70aa --- /dev/null +++ b/checkpoints/Qwen3-1.7B/12.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f50df573e3b34698a2d17f801d2c2dcb48eb1ed8b4a92b2d4cb383d4ccfa07 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/12.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/12.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9afee21bcdde79d5260aa30ca67350d2148a0eb --- /dev/null +++ b/checkpoints/Qwen3-1.7B/12.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a27d55232dcfa6084292ceba266637f549762ffe432e6bf8308aea670ea17b +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/12.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/12.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a6f9b503ddb53ad1bc908437d429d011fb4a954 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/12.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6fb2a88eaaee15f4fb0d67a40f0aa0719b3a6ab35cee44561109b70a4f3a1d3 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/12.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/12.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..62ba8ac0378cc5284e39509e99682b1c2d1c7d2b --- /dev/null +++ b/checkpoints/Qwen3-1.7B/12.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1faafac62934ce22a3d990a2af5e2df7b10adfc31dd061c7daaceeae53033a6 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/13.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/13.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1079a2dd1e06aefde00e157d11ed4ef5c2abf70 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/13.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef98d83e35352d8d4ffe4753bfb3fb9eb4d9785af787ee9274c06b99a0ff2e80 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/13.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/13.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..32737dab1fbfd5a042247b8560a5c6ad73e3698c --- /dev/null +++ b/checkpoints/Qwen3-1.7B/13.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:863fa792df15d212a917c69a256dacdef24bca21be2cb94909195e83d9e9102c +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/13.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/13.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b60abf4431f527d337e1c1d9f5a5626d9f3e474 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/13.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860f719bff538cb233a6e6843b2ee94be2b40570b150641929aa7072ec558c38 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/13.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/13.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1e29c57024d4ec8b2367ecc7b6cf6518a6f839 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/13.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a6b234b0e3bc09b10ff870950d6f9587107b5f9e847ae00c080ccce4db6d67 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/13.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/13.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..625ec52c3e9e0569a29fd28ab068dea715f75ef1 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/13.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aceeda9f3c26647ac436438395a10c3e8b603106f3baa21ac027ed4a3f594975 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/13.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/13.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c6f6078e7f6e532ee26b2743d4d0ca2bd8e98f --- /dev/null +++ b/checkpoints/Qwen3-1.7B/13.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eec2a4b918c26d8117f24dccf273c36d7f51e1f311d1ffe7653bf310bf5ff28 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/13.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/13.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..067e0696ded8f883a359767c7646f8817b016c03 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/13.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df436fb13551cb313b349df87dd5192891e4d365752e0083a90d994f75f9e300 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/14.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/14.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea3e75fb06603a73a18e30bc8ccc49a9506e8a65 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/14.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8653b407aef7e98edce01b77f1fc3bee149efb6c27f5ab2c35186939f013dfc6 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/14.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/14.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c94e6bc9e8d87a01958c78bdb660334b711e7395 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/14.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee4849052cb8e79144303e5f37cd697ef0687e7b4323d6f9b610a336105d692 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/14.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/14.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..761c3d3b4f80ff400aa1ccc5150672f41a0d58d0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/14.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354a2187d21c8f5944a40ee01c4a2a5b3e32c1ac8fe041e2b16855ef3e280025 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/14.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/14.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..25ef43d80aa018e09b50dc9477211b5533408ec1 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/14.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:768b95f0ade2e8099a770ff3d6ca1cec78b9f36b56ae7c11875b16db0721d3b9 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/14.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/14.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb610d9c8cfc4af0ed0ffb73edda9af65168fe7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/14.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:def39d65cbf014e4bde3da7ca52112d6c0ed8c3f05213e583febd77d1b7334a5 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/14.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/14.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f9202e552ba5eb3bf4dbf83c5b40d8090617433 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/14.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eab462f6b170cf1cb12d91dcc08732f159740fb9293ab075d77b2c95bd3e4d98 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/14.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/14.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9fda6440abf3db4e1ad6063d02c846b79938a42 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/14.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b30f6635e38389f9bb9c8c5b256232bd371a75c961012deceac18b49d9190c4a +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/15.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/15.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..72fae1d375b8e75cc4fe6d17a632a27fdae4c4e4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/15.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1506c093ba9d736f68d9282533b3936b728f563a9658f61b896d7aab8e1153 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/15.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/15.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..69ad0db70c28db5308578285e4c9eb88b19703ac --- /dev/null +++ b/checkpoints/Qwen3-1.7B/15.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fce30dbf4bd3323cb5b04d29969b7e3ca1b84a2056a7e47d93be2f17c1d60dbf +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/15.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/15.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfcfdef485c0b6863ce0e4a449188328ef3defb3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/15.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e726db33ac6ceac0918843bceff276e0bd11d1c324dc2bbcc3acb8cc6936404 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/15.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/15.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..86e9c8dee713ac1a4704d1b2fed4c43b9457b201 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/15.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370b08a14b7646522c2b6e69f9af8845e9b69e1781444e07018bd9e98f60e041 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/15.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/15.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5f3a3dd1d511159bc9a4101db30da620f13e66a --- /dev/null +++ b/checkpoints/Qwen3-1.7B/15.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e275808a3db55f0564596f9fff197ec452859e8dbb0330687645144f7ad8dcc7 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/15.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/15.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d86f3283bcdcaa2a841e32f341ad8ba7eabe63 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/15.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ccd11566f111387916be3938007956110624b5f2e862457725397ad21e15bbd +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/15.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/15.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..97c6a0fd652048d0f427b8dc5a3334996fd55230 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/15.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984b8dd7fa1aaddabe819a3a8b39495809c395df2adf5ed9c172d7786a1caeef +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/16.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/16.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd0a23e2b6fe2e7ede67b8489195b083e0efa183 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/16.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2089c20ff9ae7ce44f0918946c788369c0cdd6f143825273409c107e5d41efe6 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/16.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/16.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..81c0b8089721fe6eab589cc0b5ed7252276b4374 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/16.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f78f751fa86a1d34a74ae4d4861ef571203a9d8fd52180c5579d317838ec28 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/16.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/16.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5984f68240dc969813d2eee3cead5f2939804edd --- /dev/null +++ b/checkpoints/Qwen3-1.7B/16.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c01a432ac0d0a860ca612881deb5b510df6d585834014b9182a8af7a0defbf98 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/16.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/16.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ffbca449d54a419b2eea53a9d2162e6c1633f36 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/16.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44defd557ddc1b7485b8edf462bb386201df15ca7943ecd909930117643af6a1 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/16.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/16.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff6f2d95093c9e198b33c75aa3abbbb987b25aa --- /dev/null +++ b/checkpoints/Qwen3-1.7B/16.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780c65c032725e93fbc33cdbae45f561abb785a17a710345e639f23706571bdd +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/16.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/16.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..861f83fd5f4319f002a7cce254a943163061740b --- /dev/null +++ b/checkpoints/Qwen3-1.7B/16.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61099848ba81672e64d582101bd1c5213f895b148e02f71ec0d4e23653af3dc +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/16.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/16.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf7ce41adcedd3a33e283c260e7a2134a9da9709 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/16.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e6cc9994611c1ded33753ca472624e378fe1e7cfedd39beb9a69af463c4e916 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/17.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/17.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..02c194edf4c40c7c20e8d17d497ea8d5f762f2aa --- /dev/null +++ b/checkpoints/Qwen3-1.7B/17.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab621969cc9355eb9e50cc487db90a51d6f75b42ba32dc957509d2f65d43745 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/17.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/17.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..76b09b5065897a188c91bc3e99d9d61c00752a2c --- /dev/null +++ b/checkpoints/Qwen3-1.7B/17.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd88258a60eba2520e925bd39019d32daf0d31c776a01fe1c5db41d99c03774 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/17.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/17.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4c42446f7faf573430831a1fbb4f858f33cab50 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/17.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da00e6357b0ed4c359ba766cfde37f3a6a4ef2c56de7310f00d68db45795d93d +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/17.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/17.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..90e8377270029bd24f9372f44714cf06b08a4526 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/17.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77eef0f99fe0e2562524ff510762367a71047c15400ba6d3c08aa4c44d8cb0ac +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/17.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/17.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f428792dd6727866cc55ca064e0752eeafe88698 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/17.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f11b575d74db4a308c1ef11bf4c67aa7ee8ce234c433582cbdfd5f25c5e2595e +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/17.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/17.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..de0ece308ad291dc5add64eca3bc1474733b2e53 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/17.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a12a23a56cbb620281879b9207a2c9ab3b614dc8cb23ddeb9767ad9291567167 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/17.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/17.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f586403f593c387201e925725785b3a49e6c2714 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/17.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d1feebb2c92748b670a697e87aaec83a7f792803961aacd070eae84affb04b +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/18.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/18.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..034a35f0cc05b88762ab4be77da889cb934d4d89 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/18.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b234d1d15f32f457f4b2311ac698622adaee07f315d7363abeacccd49f35ab38 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/18.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/18.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7cf38a409a42e345617f523afd92a16f52e39f4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/18.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05dc18a061f4c2147e8fbb29d7268a893e4984690abadceda55f36b52e0f1ff +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/18.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/18.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cd1711b4023bdd25dabddb0084bf697e502b754 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/18.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f2fb94cbbcddc08c9529389a1a7cda3f8a601cba42d938b81259e614f1411d +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/18.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/18.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1709d8b4ca9be32425269d5c3ff544f5da87496e --- /dev/null +++ b/checkpoints/Qwen3-1.7B/18.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27717b5597d0cfeeb3f29f0dea58ee226894cee488a7e5b7fd9b4b3926819a81 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/18.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/18.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ee2f2b74ca5d33057f654a33aac7ab759c54ecf --- /dev/null +++ b/checkpoints/Qwen3-1.7B/18.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff9f9e715cee60ff06992dbcfc4d98e9cb3fcf55b482d57432208629034e7d6 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/18.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/18.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a71146ad0554c733bfe4d2a1fdb9c47a67a4aeb2 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/18.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bbed19fd2406e9bc465f4d48a5499af1ecb032d2d90a352c824824084eb74ba +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/18.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/18.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..903da6c973667818a37d43ee912c98207da67c96 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/18.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f6be89751ab3a67d4d95d9d06f9a4b9bcfef359cde13985437259b19b9bdda4 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/19.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/19.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7635fa3841b73590da2edb72acf1b4622fe2b1e --- /dev/null +++ b/checkpoints/Qwen3-1.7B/19.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5664b14fecb6121092195a18da44d5ec741118dff76334500086cab9e409595f +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/19.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/19.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8024a22943f91c23f83e3bcba359f65b67ce9805 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/19.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26443ef31619629f7a291e987c2353339e7f1a5f4b0fe0f7aadb79a67120eccc +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/19.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/19.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..71006af763d3ba6973d4aa41dec54b3cad6432e1 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/19.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:637fd76647ca34bd3a657c126f477c2bf7a33d6eaec3ef391b8fe522ac0f4457 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/19.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/19.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d4d4941c0200ac2b9f7d5ae1fa1d42330ebece --- /dev/null +++ b/checkpoints/Qwen3-1.7B/19.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b0b7b5e6f964a6181e59e8d7d6a3d9af5658410effbc9fa3ce26d8bf8429f0 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/19.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/19.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e26ffff85fbe3f2bc7eedf2b66ac3e939f22be2 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/19.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca709da4cdf17e7256b91cb9838a3529ddcde3babaf378485500125eecb5eba +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/19.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/19.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8131e2a4a76b84e701f93ee6f15cacf4b6cc276 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/19.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e89ad20f11c7a2e65f702171f384f6e37e3544112a8b3839fcae61e6745fbf90 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/19.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/19.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b27c31d55253b3d300ed986c556d50786a77924f --- /dev/null +++ b/checkpoints/Qwen3-1.7B/19.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49cfaebbf9f71fc1f0560b2cca442ff2863180a60c11052865d6c6b64a601f90 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/2.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/2.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6460e41f3847ac457183228a846fcd963bacfe8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/2.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e7e225fbaf89fb9c6b76c74dbc2d42be75661bf5eeaa422f051e3917d41dc41 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/2.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/2.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..24a27fa1fcae98a9e50c064c90cd34b349670659 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/2.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6443c5ff0ca72b9947d4e5a9b6a9bd4f6cc4146b5d22fb02d5aaf44f3e1252 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/2.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/2.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..85faac6e3821f4e0544de9bc226f5b0006e96b90 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/2.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99aae0767bcb6e7e2fd5a4339629bb5dc882314e91e1612f1f681d66a56494fc +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/2.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/2.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..af52859c2b175791a2623d2891c54491b042f49b --- /dev/null +++ b/checkpoints/Qwen3-1.7B/2.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e817f54f127143529df99222b78588cbf58ffd3782807d68cdb6ca54ee833ee5 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/2.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/2.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d49c3c9ae0e217a80c7b59c232af46ca4e5d08e6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/2.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c096089fa036bad5d801eebf557b9ccf5541663bf2644e98a775d7d48fe91f60 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/2.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/2.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..64b3904e7aa466f8bb2e1e687ac2bdd0fe0da0f7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/2.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb9f0b4416a30a2f34f06b15ada2472684518992ed6128319b38e438fc5cbb7 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/2.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/2.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a4c1b527967523e75c833edb159f36827eabc93 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/2.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b2430f8b0df7138a06c6ce8c1662daf4b1f7d72129b3e4056809c9ec6dcabf9 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/20.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/20.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..727e8172adb9197b4d77f039795e2526d66aa3e1 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/20.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1629a186088389326d2b4f91243eacdb830fd62e72237ae2e374a302c622bc36 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/20.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/20.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..05ec556e9eb0617a29e7e0e6dccd56eeb234712a --- /dev/null +++ b/checkpoints/Qwen3-1.7B/20.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faff85ec384a4088e30da8f13d7ce58ad6e7e70d6ab9573ab72b338987260036 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/20.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/20.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a2fe4aafe022d01b1c3ad8fe41e13a857b26c21 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/20.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6356f9675cebf1972cecf3b1c7e5f94e36e8a12e977cd3a61e8b0b99bdcb13b8 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/20.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/20.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9186954564579ab03264c45a4fc3235ca5dd91fa --- /dev/null +++ b/checkpoints/Qwen3-1.7B/20.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0dca0fa89c27fc2c58b8cb380f693b28dfebd2b11acda1b67bc509a62d9fec2 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/20.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/20.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9875d471ba9956ae234d861f6444750eba41b32 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/20.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc298a5f9b777f1bebcd499b54732192f493183f4776c18dab9ff1f39a56dcb +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/20.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/20.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..31af53f756b047b572ac52d309a6f4a53113f908 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/20.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4b273688ba47047f292ab5248b3a3f965640bb26d2d97ba6c53bbbab390cc9a +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/20.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/20.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7121132a8a6d6ef87fccaecdfa44e9d3dcc5035 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/20.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65434d6641d22cb990d9e112650e33b10f99639564c97a7af58eb772631cbc7a +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/21.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/21.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee487ccf8ffa10bd4eb9c3b6bbcd9b82116afebb --- /dev/null +++ b/checkpoints/Qwen3-1.7B/21.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:918015475ed15ccb3a63d29b022a1f45f98e4652ef5a3ca0e8a175b0a83edf40 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/21.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/21.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4a402261b3ae97d480d9a80b55aac0195b043b8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/21.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7573ab03be955f743f874541cbb2c98d8c01dd3f7f026cafdc3ebeead618b863 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/21.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/21.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d146f430333941929cadcb731c82180cd7775e7d --- /dev/null +++ b/checkpoints/Qwen3-1.7B/21.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b67a82359da85bcfc8d1bd7ce554f20872ca55b21eaf04bb17278624cac741d +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/21.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/21.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e519b437e6d3b70a36fa5c363e9aaf0e5484a29 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/21.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f09218cd2ec3823c1003ea8c9e58a6cb07ac550b3e7d71bd306babb195f89a6 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/21.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/21.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb04d012ca326828636efb25ca58afa0ce120bdb --- /dev/null +++ b/checkpoints/Qwen3-1.7B/21.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80745dbfc2959edd7adf11e7e065d4c3f7911a7a7c574a90ea5cbee829a1a50d +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/21.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/21.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..32b19e33e7bf02dcd91b5c6fed5b2692a1f37f51 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/21.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a9841ebc375d074133c37dda43087e83665aa6b1b55f821476cd2a70d607703 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/21.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/21.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6428721e47462c8c5f47a7474a63a96d3fad471e --- /dev/null +++ b/checkpoints/Qwen3-1.7B/21.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0147c60ae64cbd2a62a408b8be4cbdfde0f23a0dd59922894d3957bc1f5a64d +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/22.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/22.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..580ba7b702cff8fcf6218ea37aff84ca0496a6cb --- /dev/null +++ b/checkpoints/Qwen3-1.7B/22.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09827cf3cc344381b2239e07ef485e1cb88a92820c5d22d53a7a9d25fd5c3387 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/22.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/22.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b7c07d80bd3fb000ad33ea65dac83c51c5f38b --- /dev/null +++ b/checkpoints/Qwen3-1.7B/22.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae88416c266309989f79ba1297318b383e88714188b04306856743efe6aea154 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/22.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/22.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0be78e780168d56a9f3448bbfe19937ad1ebd2a5 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/22.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b23d5df7ce4eca32ebe3722b9bee7c91ed587523e1bb55b0df4d91cc5ae1dec +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/22.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/22.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f85610d89e80d5fb3d9e476ebdccb2c4d5a0af26 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/22.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904428091fd89f216589406f40b12193aa1620ad3af73b147b2e2aebc9b57dd1 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/22.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/22.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7c0553036d11fec41b67f625b3001bec938b13 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/22.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520d22fb9f3b0f3ad43ffb73b0e104b350efdff54139843fe59e321b739bfcce +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/22.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/22.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..60a89d438539596d17cf5a41724a2cae96e33eb4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/22.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94301f68fb18b292a930c6f187c4e5769d0e23b03e7dd361b50c50eaecc89c43 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/22.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/22.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aa419e7174397f3eaa412e5c293d7e7aea04198 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/22.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88b2acf1accfcb095ab052836bcd6c2ec23060b6e5ece3114925134bced1f08 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/23.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/23.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e97addbb4f7fab1bfade199e60c4335145136fc4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/23.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2855c3f42d42e84c39b31684bc646045e5a576e4d1204943147d328a1a73daac +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/23.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/23.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3f0c8ac65b315b71a5c481d9b88f3911b75c8d0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/23.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b058a9adba529264a2f3594fe477cf2a5043ec49f0483259ab03f97053ff9e02 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/23.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/23.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ccfc365bfb5c0a638d8bcf7d1b18ad1ab248e7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/23.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9273752af081a73df1efa6d53e0e818c42d7359b2aef1a61f365564608df8c5f +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/23.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/23.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8e8acbcad776a7487480164589ca0e26ac216fa --- /dev/null +++ b/checkpoints/Qwen3-1.7B/23.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d99f7cd89d49d7fbac232ad0af588031b7ea7b2ad8263041c5a553261be0bd8 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/23.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/23.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fbaacc3bb01abc6a6b398665d35807dc80061a3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/23.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74de4578e01b912cc1e332fd0512d77d88212f6742dd7b100678e86f3097dbe +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/23.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/23.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb1b96ebd0ff7512665c4ee1b413afcee931e665 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/23.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1a05aeafaf7d046ada0d855e20098b2938661fb722f62c805ed12e5cae2ab04 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/23.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/23.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4e2a72450679a800512330281c5d7ccce8a9517 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/23.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5ce3ccd740041fd19003d43b6ed2b4add445087c84b0b84d3bbb7f79cacc2c +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/24.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/24.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..613556a916e0b3b96dbc2c787e9419e9439b5927 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/24.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30bdd6c0121d0299d552b9b87c1fc859aafc36e4d3775382c539e2326e689e74 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/24.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/24.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..992cb4ffbdb4e9a485087ff452cd2cdf3bcbaf6b --- /dev/null +++ b/checkpoints/Qwen3-1.7B/24.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cefe45fdb8fd59a3bd665e42cb8eaa309339b74a9917a5a653feb9db54a3119 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/24.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/24.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e7a0183613d5662e5e4e861674996d6e8c02c7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/24.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5be65b742268d5aff720d929047d7382135d4d8f1793c34c4656728f89348ba +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/24.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/24.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..65f71ee597d8b1657ff043c7b05989058a908df8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/24.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b0dae571fb02b0b5761b5e9c0216b364a8201509907b7bb44d28ce4d175992 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/24.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/24.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6c092b3f1819db3969903d9e98091e36c6b3114 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/24.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a2baeb77cb77e6d1a6a4f1bc2e49fed4e28bf5bde918dbbcfac1b63ff113aef +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/24.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/24.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..45fbf8b8ea756c5fcf5220d418b1b28bd35eab90 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/24.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a303fb9399a7c6bb980345073015364cf09673ec5e8f45b40e0b743541e40ac5 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/24.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/24.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fed26d6d2779bed9ea7ef4db3c12679723dd49d --- /dev/null +++ b/checkpoints/Qwen3-1.7B/24.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb33b63954666f7e703611b53326ef47c342f9f9d77f129f9e8aa05d71d2fd81 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/25.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/25.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a5a2f6737f6ff8f48482024fa045d37a5104221 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/25.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfcbf1d29fc96030bf28a8112640b04ed9620c3b9271c56c87cb6bb5956741d4 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/25.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/25.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4302dc3aeae43afa4181e4cd70ef564b31d17641 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/25.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:318d75c9aa9d09f031f7206a8c227b26e5cd81d44047ebc3a9704a62c2a1141c +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/25.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/25.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..656eba5837290405d5e0a5dd714c5ab40e0bfddb --- /dev/null +++ b/checkpoints/Qwen3-1.7B/25.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35be7004d50c118b8a7f51db783f9d982175625df9cbc226bea74e56bb1f6b72 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/25.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/25.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2926c9abdacd907c58e689123aab7f90032c64b6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/25.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba74501e283548d50b5e1c0b8c70402eaffbb1f91a2d925f455d1dee206bc87a +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/25.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/25.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3f9dd2641da342afa3c45ba4592cf2f8b948ead --- /dev/null +++ b/checkpoints/Qwen3-1.7B/25.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:335016a7e2e96494d8d054cf10519e767ce55c9c29a54aba64709c2933322e1d +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/25.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/25.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..300f4c03d9ea745ff15640020b7ec6398132c975 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/25.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bd1a16a484914a13b0d2037a4a7f4fbf4b8ca6bc0e14d7afb3dfee57d71d266 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/25.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/25.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddb31984fd38c430ab880c8142e77291899e9c27 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/25.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56eed0b8f5bff63ff54a509f368378eef9a166171e2d1dfc98e5fc6dc0499f5f +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/26.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/26.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..299d56deafaadb00612ef5c51d257398980ef68e --- /dev/null +++ b/checkpoints/Qwen3-1.7B/26.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b5fee87614e036f3ee08e1d98314ddd451ea738bf67daa33141bbc8e0b4ebb5 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/26.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/26.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e39c5e5d4d4e68487ba3cfcd60a2bc3e03509f25 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/26.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f327d2a037778731034158c8efd65caffbf9b50076a80c7ab92968c13b4f31 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/26.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/26.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1703aca79ef1d2a8aed823313dfe8233accc9056 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/26.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1106421e1545675220321a5bc74518e1f5bc28f421c55fc07741457620a9473 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/26.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/26.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c28cfd2a73be94269835c4f8fd61bc9a948d4269 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/26.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8506d8e4f65a8ecc1e4277f58bb1f40ea6d3a9f166a11157050eb49c0785101d +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/26.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/26.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..473690295c59d8f1496faceaa387c7ee6a0357c5 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/26.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dae9a1d2b7d63d5fdc5b87001bd4e5ec95d753ab02836427a03705aacbff445 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/26.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/26.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2697ce96dc14dca1aeeff82c4165ec37152db8b7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/26.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae5c4af753889f03802cf395771e4884c188349d1d5a5c5e7da7d722ec07f7ed +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/26.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/26.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f033bb0dabefc4debb1fbf1e732ed28272386107 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/26.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f72e297bda8942fc1fd0ff5dd3dd545bd3af590c6d404d455d27f26a1908db +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/27.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/27.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..50f23c6a8ce664a5f786b405a975f0060cae7309 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/27.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f8437d30bf6476bd041295477ab743325ff92f150b7b6c549493a96acebf3e +size 25748391 diff --git a/checkpoints/Qwen3-1.7B/27.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/27.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..11b74bddfa58d4f1d65fbf42502a9caea0ca421f --- /dev/null +++ b/checkpoints/Qwen3-1.7B/27.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9318888113ff51faf9e8a2b1f2aeefa90ba61532fddd5a323a8bd2159c3a6db +size 25625511 diff --git a/checkpoints/Qwen3-1.7B/27.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/27.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3afa6b7945f88cdbd1fc44971e51f25797dba9ee --- /dev/null +++ b/checkpoints/Qwen3-1.7B/27.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5469428ba88acddf6d3859b602686dec59a5a8b194cd7d1fb25ff14b37a94330 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B/27.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/27.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..76999625e7c31937f479921af5efa05931cdffa8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/27.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ff16c09afe759647879be7ebfc320108e4c2a4039316a8303c9251e181e8dff +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/27.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/27.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ca588264352697357efc4d1b2c006450f6463ba --- /dev/null +++ b/checkpoints/Qwen3-1.7B/27.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4dc568582f5c5ff59fa3aee1e9b2d767f54c80ef314f72bbe4c9d3ca927710d +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/27.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/27.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c39436887913d639f489f3a0f6e429ec51acfc97 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/27.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1afb96a4fea0862b15814dd16ec27cd44965825f85b04dc6f6bbece44ee5132b +size 8586208 diff --git a/checkpoints/Qwen3-1.7B/27.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/27.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e7e7a7c093fbeea3c98c01b230fcc5bedeecee3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/27.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb40e28c073b20682caeb482743195c5539ea597bd197824bf786be661fcfa46 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B/3.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/3.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..64251300de27df7885441c21b83622d81216ac2d --- /dev/null +++ b/checkpoints/Qwen3-1.7B/3.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:483e59fa6857af11dcdd69d7f505b04a1689293852889432926282b56dacbe40 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/3.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/3.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..931128c9cf19df9afde61d05f50b2c276146a8ff --- /dev/null +++ b/checkpoints/Qwen3-1.7B/3.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c82ed28454aecc93654ccd2d2b33dd92d63245e6dd0c604c02f18cbf243c94 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/3.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/3.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e286f346b9aa36a8743a53f433e90f71f585fff --- /dev/null +++ b/checkpoints/Qwen3-1.7B/3.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9903727df0d9b5b0aedde9081b71d006d434e5228d658c7e028f9784310c0f23 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/3.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/3.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3458397cec4fde267aa7f8471d97cd29ea03ffdb --- /dev/null +++ b/checkpoints/Qwen3-1.7B/3.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88e130b33018bf3a20011ae9f1e44a3275c8aa13c482441c4d96357bd28c4d97 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/3.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/3.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..26e584ecf070532518ed16f07d27fcc0489f5b54 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/3.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25dd97909cda07cd52c1e9df2aa5f417bf26bd212474e5f64b88379624913718 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/3.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/3.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6987873976797f16113086e1a3dd915e1bc524e --- /dev/null +++ b/checkpoints/Qwen3-1.7B/3.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfdc66f3821761022c17c3cb540eb62de72efc72947410280e0ecab51577cfb4 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/3.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/3.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..675223947c2a722d721e5a395a8569506bd686b5 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/3.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b94b334acbcc6d2fafdd732499ac00bac24c4adf0da1f6278a6ecf3684ec7ff5 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/4.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/4.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ef2bf67acd1880c6924178ce5e321e7b0e16d9d --- /dev/null +++ b/checkpoints/Qwen3-1.7B/4.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef8990713f28bfdf8d3423699be27926ad0e9ad531f7ed279cc4442303c8db8a +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/4.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/4.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e403017351c0fef4915f22b063ea948ea5a1b28b --- /dev/null +++ b/checkpoints/Qwen3-1.7B/4.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0c207a2f44c2c1bccb6d586a490a6b2286a26feba591b82bcae16d895cd222 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/4.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/4.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b114d0b654ca1bd5e8b920c879b4dd38e8a91d2b --- /dev/null +++ b/checkpoints/Qwen3-1.7B/4.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cccadf050319b64b7e8ae25c5b940d0e2c6e60b008de32a89b1e1226ecee087b +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/4.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/4.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc1eeefc4fb04ffbfc8e7830d58025ad209b9092 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/4.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37589ee0ce5167fc0a0744dfb71dbf62c305caf7b640e36d639a865f564fdd70 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/4.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/4.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d239193b7c49cce87c8eca59e47646ec1c13b3b0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/4.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bc01645a6eb26d46bebe2bc1e6adcee6c66b7101b1f2f3cf3842d423e820fd6 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/4.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/4.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..00be2dbc89d3b6d251a56cb3b399ec584a419712 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/4.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b50c96c84085e610b9f8579037b8a169eab1be7945347afe4cf44eafde8ce0be +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/4.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/4.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a09a45acd3d8c2242b96801380cb529548e8e093 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/4.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a11e0fb75b7f1416af2f0eeb47b8c58a13a53c3c375d840f6466a366f91dada +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/5.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/5.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5455be30cde7dc6b29c6f6fdb84ef7092349575f --- /dev/null +++ b/checkpoints/Qwen3-1.7B/5.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49c11a4d5736c50a2df881fe1fc732915b8ca710fc0cd77911898a8386d32975 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/5.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/5.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7142a0d8b9067921583a14a8e49a352726348af2 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/5.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e41e629337ac86e8b0f74b2fd6f70fc3695483872cc7219e6461ded71e2c2b8 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/5.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/5.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1315a9f78e1692c7c2c4a86315bad9aee7fb2a51 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/5.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aece891f7f73065e854ff76b7d4419156af5d89fc072661d92bcad2aae50aa9d +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/5.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/5.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff39eb6bfdc9266555e584daca3ea788b135afa4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/5.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c476efffa77da857b6291aac005b325e9aea3274dff01ae947621b8a9c612a8b +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/5.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/5.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..084e70d8e5cf80d56fcf62077de589c1a10be208 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/5.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2fa420a247e967affa74a7e5f23ffdf563b330eeeb4b00b1bdb1e5c41338fea +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/5.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/5.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e28a2a08b1e8580c9b92eae3c8bfb13840868e9 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/5.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:190000d4728f8fdd8928855f4d6671b1c7677c63a361fd781cb1d4cb24d585a6 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/5.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/5.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..55dd5fb171184a9209a06e65d841d4583bff3a4f --- /dev/null +++ b/checkpoints/Qwen3-1.7B/5.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5ac252b3a072e74fbfc4651d726b0d926770f49f014e9394fd7cdfc5c320055 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/6.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/6.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..37df886aca54a2a31371cbca32be5d48cc080aa8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/6.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c5d44b3b2adb06878d29129882078b35dbe1a81c116a5fcb65b8d4ee86a13dc +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/6.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/6.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..48963201ba7883b9eedda4eb939643a306013b34 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/6.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea3407344eefdb1b37977d442fe59dcaff4edd22975c3c6c940652a535cc83a +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/6.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/6.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..60de2e918b4d866e8701451a54149977afaa056a --- /dev/null +++ b/checkpoints/Qwen3-1.7B/6.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc0cb918c47196b20917eeb07f4ab92b334419039a28033380842411b5936cab +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/6.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/6.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..be8e347bc983ace03cafd41b58e3ac72e7688e42 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/6.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d57a45cf5992360c7e9108b60d44dc81691417a2ffb4279bf8eb49ed84d47c5 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/6.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/6.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e9756660aa8346aea8a037255e916ff93438196 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/6.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b51ddcd262e3131928c71600f94f5b12d2a418b322f14b9a99bf0077ad607223 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/6.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/6.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c819cbc0fe199942181a1e6fa19d065389ab8ea0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/6.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f7362d63407a2a0e0b04fd9293a22d0476496bcb6e173aa6b30bced1e4827cd +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/6.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/6.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2d47234b2476ffb805971ca409ca591c58cab55 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/6.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17eee0c3dc60ba5c48e4787967173414438a9520cba7cd65a7db4347190b6997 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/7.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/7.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..002eeac9e8a70e5271b5f5411d87d69581d2fabe --- /dev/null +++ b/checkpoints/Qwen3-1.7B/7.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46c117de1715cf53374217caa7966ca91d4c83f50a2dbcb65df1a91e6298808c +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/7.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/7.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a46fc83634dc0449328cfb88676295a0d9f1e65 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/7.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7db987e89bcc060ddc3fa0c97d9ab48fe1e3446e8e2a559be1790ddba23249ce +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/7.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/7.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1307768c00f0611944b7d4ce035d54d53462e112 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/7.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:473fff1aa636c543c80641fe10f1be65fed714a2cf8b4eb29ba9bcd2f5c860a1 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/7.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/7.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..aace36fedbbda54ed75fca01ca47272414736024 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/7.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efeb9eb1326310f2ec65fe8b1a6230a0a9bdd9778c45dc440eff6a5a7d0f5c6d +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/7.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/7.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..19c3d14303b04a953748db07013477b2a5d55e91 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/7.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6405f09a26425209dba0706e52a3d56546d40f8bc03a4aa1f9354ac83e8c47c8 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/7.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/7.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4520f2d01be6435a467300f5a5e743b1d3d9f120 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/7.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73f426a7c1e7f4bcad1a465dccf9d0a5a79a2df7efe20a7733005bb8949391dc +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/7.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/7.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea809fdf478d37905ce687036a92ce3757b6657e --- /dev/null +++ b/checkpoints/Qwen3-1.7B/7.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66875d6c6c75e2c6b7b1232d75e197a32c6c55d4d9ce6686d645e28ac150f0b +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/8.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/8.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..95ddca66c265809fac4d82798c2121e3427be3a6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/8.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b0fab0a20b9654677e4be2d14abb337b7d5c2c9eba95dce89c75f6b664400b +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/8.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/8.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa59c52c75b0a82de10abea3db0b95ff81b9e93a --- /dev/null +++ b/checkpoints/Qwen3-1.7B/8.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff9023097d56927478d3b874ff0367e6f19f5cb8f024bfc2c13be088bc1826b4 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/8.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/8.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cc5e5a198e85466a752336b49e304564dee2ee8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/8.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39ac97bbb389c8a24621104b77bdd90d5744ac3369e3e75492d4cba4c41dc9c +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/8.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/8.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6aa1158149d39288b7b3fe91d1b8e93ad3c59ec --- /dev/null +++ b/checkpoints/Qwen3-1.7B/8.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d88f68755135b4bf412bacd01fab2b5cf29ec48c2f33ffc1ef38bec3b67b11d2 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/8.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/8.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f194a7d652ad1e5ee61b7905bf5a3e72fe52ea4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/8.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2502f683c5d937c33ec9e2d5bd7ffa4e661188078da8cedd00a325bebd549d1b +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/8.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/8.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..417e22099071ed0a09de5ff167665777e96c5921 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/8.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f41f1cfc376b596ffbabed0f4567734c530626cc54bcd67e694f60a677126d04 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/8.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/8.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a96ba616924ba156640dcce11b3d0d316812d22c --- /dev/null +++ b/checkpoints/Qwen3-1.7B/8.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9880885344e950ff637f7af76736a8807ed31ed28e439a674d8cdd8c486cdb +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/9.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B/9.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dff3585c5a1cad4a2be0541cdf77463b4d8b90e5 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/9.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30c5f59f1cc0315df53dcc04bef48b25e0c17a404151d97004a1456d952a6f0c +size 25748372 diff --git a/checkpoints/Qwen3-1.7B/9.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B/9.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f04f89ea93564d5bceb02f28a116ee8e4d3abf2e --- /dev/null +++ b/checkpoints/Qwen3-1.7B/9.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a5fc41cb893194f0c1719d92c64c63a5cb8c7d82c22f3dd2854f65e4eeed94f +size 25625492 diff --git a/checkpoints/Qwen3-1.7B/9.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B/9.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..86e525487c0b6c7b6bea7d7a8560fb07be8c11c8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/9.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0b58c5efa49222a0f12e464a1a7f17b2a9cb91cab93463171257c29c9f4e824 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B/9.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B/9.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d0f0d53e15335b291d8230c41db5bf79c497e50 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/9.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f14bf220d8460abd3027bd0391d8cf792ad45b8c4f306029ff942ac207eae6 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/9.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B/9.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..89fecea238c535861dae926a894aa06140c32e1f --- /dev/null +++ b/checkpoints/Qwen3-1.7B/9.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88c82250ae8cd4e4b442d47e53ad08c70f0e6c920203599e757e46e39d76839c +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/9.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B/9.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d507b1ad3ab65d9cf2c47dce7505f396748e2c49 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/9.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f09042cd4081a15570671061fc1b347faa84514f47b8c9a21a9bce8490f0c7 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B/9.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B/9.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fa13a021e03bc2bc0a01f106f45baf0ae971c17 --- /dev/null +++ b/checkpoints/Qwen3-1.7B/9.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d8aa7058353fdaee3ba614d96a7abbcd0f3b162152c1585d91e8c8f616751e +size 4326349 diff --git a/checkpoints/Qwen3-1.7B/args.json b/checkpoints/Qwen3-1.7B/args.json new file mode 100644 index 0000000000000000000000000000000000000000..d29788bc1f9432ae884270230bc23e4ae47370da --- /dev/null +++ b/checkpoints/Qwen3-1.7B/args.json @@ -0,0 +1,45 @@ +{ + "model": "Qwen/Qwen3-1.7B", + "epochs_list": [ + 10, + 10 + ], + "early_stop": null, + "weight_decay": 0.01, + "betas": [ + 0.9, + 0.95 + ], + "eps": 1e-10, + "loss": "smooth_l1", + "q_group_size": 128, + "n_bit": 4, + "params_to_optimize": "channel_scales:0.05,angles:0.05;weight:1e-5,quantizer:1e-6", + "use_scheduler": "True;True", + "sched_freq": "step", + "datasets": [ + "wikitext2", + "c4", + "redpajama" + ], + "val_dataset": "pileval", + "train_size": 2048, + "validation_size": 64, + "batch_size": 16, + "seqlen": 2048, + "seed": 0, + "use_og_input": false, + "shards": 1, + "results_dir": null, + "resume": true, + "layers": "all", + "output_dir": "./output/random-pairs", + "init_rotation_params": true, + "num_rotations": 8, + "num_pairs_factor": 0.5, + "use_kernel": true, + "checkpointing": false, + "reverse_pairs": false, + "random_pairs": true, + "first_n_layers": null +} \ No newline at end of file