diff --git a/checkpoints/Qwen3-0.6B-Base/0.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/0.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d07efc24e0bb805ad7c66f3572ba5d52cba8c1f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/0.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1369dbd879fa25799e92554d7b8b7b26b8a8663a945039565373dac2b28400d7 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/0.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/0.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8274596c9d601926c0eec3de6f3854b847e3bbaf --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/0.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387355f672b61b2b48d5ae1a42ed260324b5e3717831955a778c17aa24baf8a3 +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/0.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/0.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1a409062c8418d3fbc116b1225b2515db89de96 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/0.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba8abf71723e41d3e773315827a0716dcada55d523638e9fdb93b339d1053d13 +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/0.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/0.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3701c17848b4bbeb31f27124e4cd06255bd87c01 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/0.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86f34fe7d2b1df057401d0d2c736206acb8e28efe2baf8645a3455e70c2f922a +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/0.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/0.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a54e4a8cf74a48bdc930778215ff675d9c2619e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/0.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7d1e5826aaf97a14c51d429ad1e8253b167508e2d0bc7818391f8024a1f557f +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/0.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/0.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc35491e3997ddb5612e37fcb3a9bff4e8aed562 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/0.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd176374d44c3f24d4c669907f2ac31a36ea340f6234588359edd3575e72c20a +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/0.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/0.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b7e9cc4559e8434d7f64908f0e4c4b3262db6b1 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/0.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7f4e7f5b6b092b44aa3a8b2c842db280848036af24d68c0b86cc2ac7d7d1e1 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/1.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/1.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da99c4c237f282e599a80efbb9ae986eb1565f3 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/1.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad03833a0a1979c812ef27025b60a96d52c93396e830c3cf5951b4fb64702577 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/1.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/1.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..911aebc439ac167053ced9f393537440c54517d8 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/1.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc6188b69b57bd443cca4bec5e207661895adc88ef91321cf819a185b28ad9d4 +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/1.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/1.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..923483db9d08f829576e52301e053619613f5e2e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/1.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f34a050ede253172a32043b2b5f2757766f4612e04112ed94018340cf83701 +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/1.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/1.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..632a608e7a2e2aafca246fcaad11d706dfdc3425 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/1.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28000bcdd9f3de0047aeeaa8a9e83548068642a722d108bcb2d2ce57176e421d +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/1.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/1.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d847f34b1fb511c94cb149dc9c1180d91eede15 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/1.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2595dd0197d1fa88f031b3a91d8cc570132ff8f97968aeeafa8d725c5772de +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/1.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/1.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..19222c660b4d84eb96020caf362ff4c78e312123 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/1.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:189dff2182f1b2de4481be51943314e18cb35a4757e8a1c11bbf937870183aa3 +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/1.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/1.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f351791d0b4b4bdfb578839d72965d536a2eb971 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/1.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292867b94ba25d2f0f09fb96ed607235b7fdf43613e3401cb02fedb17b633743 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/10.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/10.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b09fb866dd27e248b370e1255c1b296d94df300a --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/10.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:253d9daa009dd61beac9f0542edaae06333c04671254a64d18022a564945ec93 +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/10.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/10.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da9ce71c1cfdc43d2853ecac45caaa7489c8d3f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/10.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59fbd855ad1912f1931e052e8053bf0b85c82f24eac18d116ba2098bc26885f6 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/10.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/10.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f18697258e4c22eb3eabab6710bbb3430763df83 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/10.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80dec41020704af3a83bcdbc78e4ba4fd260823f9311a02a98b0ac2d5495b0fd +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/10.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/10.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..16ee62d9f3ddb387a14dc1bce3ffffa134197e70 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/10.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae83825f44b2c04aa28331fbf7ef3efd93262e48a788dfcf4f34f8374e7142d8 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/10.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/10.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..942f60d46e8e1e8c613e3885f47f9a77c726b144 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/10.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829ee92098af1c7d77c91ca1c26af3b17ac069ba5ce7a627e774a657cc92b1cd +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/10.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/10.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..97d86a5e2602dba37ac5017ab2b85934c21e2300 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/10.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efefcc2aa86d63972f6fc3f13f4601761cc71fe0cef68ddab5c0bfb77bb7c757 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/10.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/10.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ed565816866a57691328ab3b8bd7d99f62eb92c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/10.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01fb0daa06885033fa39e521d9e5856bcae27a09773fead15d80ab58e5be7e03 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/11.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/11.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..86fc698a2c3474d822c0947663097ead2ac3e013 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/11.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d3bdc27827fdedaf966f04f1c3be2c5cde24333aad0a65e29e885347772d8ce +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/11.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/11.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ef4219ace021b12b13a17b00f5281ce726a5db --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/11.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ae29cbc583e10cc24f5939b5943f302480a097d4094f1dc140ab7ec22e9c2d3 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/11.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/11.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f549710d9e306bb579ec2e4083171ac7738b1e8 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/11.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671902199b0e53a25924baaab21cf7faf7b7049d30766e351c732f802e932b7a +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/11.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/11.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b3ed5442f9ae48b790e01ffdab094f3086cea4e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/11.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82816f147a435998a185b9797b52f28d5cf2ab33ada9089d32c4c258473d535 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/11.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/11.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..53dd483652924dbc34aa77175c6344f934e0780f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/11.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06ee54b79d347b70646904aa201dc9cce62ab8c29394d535aae9c5c468f5302f +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/11.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/11.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..83ef6addd78562c86b94cb94ef9d623b55b1385c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/11.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34d3838af030b8f115464050f5966fcb4975e3b021d7fc31596f21b32c826f1 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/11.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/11.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0047f652ada434126983cefded3b25433b622c04 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/11.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f3e9eef3696344640adcae60cd58e159fa5d4b77d18c5365bb8dd152906c8a1 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/12.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/12.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..64e1ccaf6dbcd8fed60a1876f9e417e3f8a643e0 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/12.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f6c16029a1f05bd86d5e60ef272eadbaa41964426403376b55292417979907 +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/12.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/12.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..779984001ab4555f2f367d28e9e8af73e577a58f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/12.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07090fa125608c5c0b1902183d58a8f023531e0d00116616d136daf247bdaaf5 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/12.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/12.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..db186d91ce57fa80b9ce74ddf646e3136673db81 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/12.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b18b5ff4ea8330e1e61709cc71d9b2e1eb5e3fc7b725fc1c074ed2ea834b877a +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/12.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/12.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f4c048f083818753df928830ea43d72d1b0920d --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/12.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a33e6da0267a1a91928d7c8a621029daa3b87eb59f4e07acfff6fccddc09f92 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/12.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/12.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aa15f60da0891c396a3d01cf5b559f9971da803 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/12.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef18f7dec645d0c1e4f3f8a8f4690b33aeac4c9088eb94e08fa925970ad63961 +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/12.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/12.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5bd54e5b610292181a5afe771d1d3a2d90ea014 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/12.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8055172a003378d7f35a97a09465718bedcdb5cdd76de288e3829a3d0d695faa +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/12.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/12.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a57da5ab42143002de4f78a6549dd6a60992371 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/12.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686f88e0be77ecb9ff167e113bdcdc2708be63ea5e25e985e7a75578c81b0fdc +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/13.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/13.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..939076220502c683e895a8c99cfa1d6f3a6f0c88 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/13.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c221f4ac7bd38a150102a350b2c7efd2fafbd0ca366418a7a150cbe280bb9abc +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/13.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/13.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..28325ac7310ed5f51d7c7f122928fb7270c576ed --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/13.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb15aed60536fb3a63435153b48f3f5a814e0466dc3ad8b2a523564f2d520ce +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/13.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/13.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fcce444d73e179e693fed987a897d31164ecce6 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/13.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b85ad17945bffa4d2e813a075b8c40061f86a41cc9ac24f77812d85cdfe0e1 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/13.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/13.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..00b45cdbaa66b50f5258ab16984bda761d232002 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/13.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f76efee92576f0048dab0ba94c84a1fdffa27ecf23d59f6b61f63b0a234374c +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/13.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/13.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9ff8fb92a2801ac97e244d914e92597962114e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/13.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:220a1f595e8098e4d41df137beb67a10bd4de561365a85aba42b44c3c94a4514 +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/13.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/13.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2903f50b224fcc46ce62854a72063d71140c1bba --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/13.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be58f808763b31d84866b7258f6da621e6b524b49b171cf34b620a92d58e960 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/13.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/13.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf6e897fcc74702ce297aa9835df510118c4eb42 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/13.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b669cbb8bae016b6694bfe4c0d12c67f64c2666772dfbd35215024dc8871ff99 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/14.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/14.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec286757a3dacb2f2ed5e4ee33cdad8ff4be6640 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/14.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0287a53a82d9b4b5c0f8fce32e06858fb8a422d42ce488bc448701070eafd94b +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/14.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/14.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..08efd68c6e3488462051ae88041ac69f60bfc5d8 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/14.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd1b946e5ed93cbfb459726d8551a0e76cda0cc94fc911039d80ef07c72c2ee +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/14.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/14.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6000cfa455a4c6fd079a93baff784ee1f9d5f6dc --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/14.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca912b7abc9dda34e682646af468f8f98f5194f7d931306db5f4e3469cc5b5d6 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/14.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/14.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..66bcdd976b4597a38c982f760c437d7ae42af614 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/14.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b2606d67e4a0871e7b78c4a43c1677b17cfc2f0186a809be10fb405c766daa1 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/14.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/14.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..716ae32b5ab9712f2180288cfdf883f06931f11b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/14.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1802a7c09e1677b007bffa91912bbbd82f8e892edab94f56fa061f9182e55ae +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/14.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/14.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c4c01be2ecf6eaf2752ae3cf5f37ec9d596b31b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/14.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c18183301dab696da7a91fb42adf55313a3a609f5c42a33f4f7e0612f9821e89 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/14.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/14.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..11bfc9f3ff6a41e67ac507014ab823c96e6c2882 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/14.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1e6934dbec780b49d92b2e4bc8e688709445b8bf25736c738920192e2fdfdf8 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/15.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/15.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b646d8b35adda02cce47782062c69ffd008e97c3 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/15.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e993e30baf0d09132ed670a6cfb7ed5e18cae0023b8a51f89cc4c4bb9d83cf10 +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/15.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/15.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0012669b6f55b5f27bf812c1304dcfa4163494d9 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/15.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9beca61203e6a0c4f0d2d3b43db1fc042ac340cf3f7cd421817c70403a4f9641 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/15.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/15.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e27baa454e52fc654f8597acb87336ff10ffad --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/15.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a2a12e89be971a8e213c06150f51b929c7f932740ba193282afc75641409e02 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/15.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/15.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e68eaf8797c0cdf82f8d94afcdd343c725b919e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/15.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5eea094208fea9a398ea346440455e0a79177fba62e9a6226005faa92ffad9 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/15.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/15.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cb7681ea257ff588a10e91be6b56f2b3e6c2e40 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/15.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe507f499c312189c0af59dd21a89415e38d8fba2a95777489d742bc40c92d3 +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/15.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/15.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a0ec810e32ecd7389596797b71ea7b9f86c90af --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/15.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:badc19f0e7cdd8661b978cd9e1edb4cd31ef861d4974e7b2751cfcb1a5812212 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/15.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/15.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8e9c592d775cb474dfb3737c9c561f2351bef91 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/15.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150b93b86355ad9b8107c8a7466481bc1a4a71ebf023f83c767c10d669f852fd +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/16.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/16.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e52ca951f170e29698fbb890b02924f60393840 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/16.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087723ba9bd2ad3b1a184e6a8c79e08f200cfaa33307f0a79ac92ee2cb7e76dc +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/16.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/16.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f226654584700c3ba2ac6e71ea4b6da1f2b1f3ab --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/16.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65562aad6b8dd5b547ecfaafb49f59100232a61ef7e0fcf474ad412600504b33 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/16.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/16.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6a7fce9e022bc4ff92dfa816f2047ee9f82986d --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/16.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0107d1876bb49ec3e98b92a0f5decb4d486f01ff14133778a8bcfe1f3921a112 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/16.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/16.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b21fb49acbe7ea3e3c96b64e904b3ae762d03e3 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/16.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa0becfe4521a26ca5430a2560f2042fb7fd2c6a982ffb1148aebf72c3a9b1d +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/16.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/16.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..edebc86152e3685cda0f63e3d78c09f5ae7d0be7 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/16.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909bb2839e535b81a36cca77d690aa3a96abdabcf36761f8a14e654236cc9d6c +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/16.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/16.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ab0a364cd726b205f6b0cfae5aa0a11113045d8 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/16.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f35f90f42589b2b5b7b8b35440931637be55a7e69800265423531ed9d49924c7 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/16.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/16.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0af756187f0092e9b77f36c7d0dc7e609c45daca --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/16.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d525870d837b9efd48b1bd114eeec1367a0236b326f027c0f9f1fa5328f9f1d2 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/17.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/17.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2933e1deed7cf7f54ab2f67ea1a001327104fa32 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/17.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fd73ce28ad3bb7d477be6ef31001819fe6ac3b84d1a876a22cb3ed8f975ba65 +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/17.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/17.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a189bcb846595b49836916bc1c813ffc702f172 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/17.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1518c4755cebbc14d753695dc7e4d017bce050685af885e1023085f9014ea07a +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/17.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/17.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a90b94ba0382f36d63f4247847da285f44be269 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/17.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:541991fce335e3df8b3a0eeac47cd86e6207bb52b1454f4093f69ea824c7b1bd +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/17.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/17.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e878e211ccf5fab6a2d3476e8084466860d7246 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/17.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:334c625a8bd0dc2ae22418205dc13042be21688404d8a351e08d8ae06ab0224f +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/17.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/17.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea9331325a3ae2759ebe9a0706c6f39a559d2435 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/17.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1129ca251753d3af8a99815ee1dbdc10f4df4829c0105c252f3445ee8bf3d74d +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/17.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/17.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb3cef8cfb408dc1ac6a36ffbb5262fea530369 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/17.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45dc41fb1bcf03bf42f1e49551e47bcccdbd980f49d21f55c714ff283a11e06b +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/17.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/17.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..46f7842b0b306b746a7d872f5696b8322bc19738 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/17.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3fa395a23fdd50e37483e8193de6c92a4efb03645e2994b3048337b1af0a480 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/18.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/18.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5c0d634c131d4c00d5dc8ffc80e38fd9b236224 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/18.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49cae44b0357c8c2f0f23754b3383c60439559b04e09c84033ddb1a05910d95e +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/18.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/18.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb2226efa7be0aa0fa0bdad131f33f1bf568eb4c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/18.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:778ea4d8f9b0e2b6689fcd675300af31780b7db630e0df6222001aa00d68abac +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/18.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/18.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d035f99840e5b6bddae5d7c7728c0c29793eca2 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/18.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6529b8537cb5ac0ef6e74828f2d148ef4a595e65c2914e9709975417978d5b +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/18.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/18.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c9464645494cff0b34a0e1e799a920d6b7d7279 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/18.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b55e1a356fcee779587f0f76fe794c89718af4b2755b4c30138d26b1032fc6e +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/18.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/18.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e1f2dc3f975577ea27306248ce02c84ab413b1d --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/18.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b106cf27cf64eb949faea78b01f980ccbe6b3918d5bbcc3658a9e3251ef654a +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/18.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/18.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e043c6211d94670e264a4b005c80b2893f566be7 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/18.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8337e52f991199a6aa11b628a265869f5c0056aee39799992356dfd90dff2d0d +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/18.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/18.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..72458dfd10c13cb30483085bf1a8299c1504ad5e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/18.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:130b08d530413bf6ba039ad63b208849c1f2eee8b069c265a1f448765e5855c5 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/19.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/19.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b016cd138e0656c13e723f3d9b0697bf817e57b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/19.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb32658ffcf6adc6c0580b3d5d2d313fc002d7a3ef3a7692ec3e5e7530142fa +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/19.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/19.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ff0fa2ef3412323f4cafd22282dbcde37bb52f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/19.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11c9c9e82fe83ff8323066b72995b2a535ef2996015502968c541e491e0232cf +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/19.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/19.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..82ec8f0995c5698c32fac29672fa986e603ddef4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/19.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08915328e6edbf9bbd94e3a88ff11ee4bb2f25eb76a7de13e0b606cbeca3043 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/19.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/19.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3a1f0d5c00037ce98f22b533869902eff53656 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/19.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7825745809f6b2b1393f282bc0dd94875f4fa12898aca759327572e15040d90 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/19.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/19.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff3af2b60564144093e584452f8ae0db76c2cb4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/19.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6642d80969a8e7b8820b1cd6508c37e6d4e0b38902928e135f2512770ecfd78f +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/19.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/19.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e4b16d7e2d3d5fbc58371a5007f8b3000b0d826 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/19.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d355a4013a37c97dded053929290437a0bfe791453913f1eb97ecf2253bb476 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/19.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/19.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6044dfd4b9dc3fd0a974ff2ceb5c40d0969ad8b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/19.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b32eb7e5c7fdc5e54cda0b59990f2b94c3302524b9a1eeb9bb281dbebb1ec673 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/2.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/2.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..02da98d95c13d178b9960b1b034237c247fc9349 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/2.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8916bef968054292eac61e913bb8fb5a1685b1a224bdc8e8c19d2d1a387eb54 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/2.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/2.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d820e9fb9c1d9c1bc8cccb0e02c7707bd3f2ee1 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/2.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250baca4f9915c0abeb84ad377e7d2a3cd00ad4a74eee6c722e6cefd0bddfe1a +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/2.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/2.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..10d06f95d8f96f37a3f8f8ad243117323dd2aa60 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/2.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939fa713e18412ef25f620ffe8a0093074461c6a67f3765d77004469768020b4 +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/2.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/2.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c84814dbb47639058cce2664e8c7c60bad18ee30 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/2.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ea1a9e420e35277e60b43981321bdf1b46099637e0016e4217fc6fc2976061 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/2.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/2.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3057c4c0f70b37b8724fe289d233f5bd594c26b4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/2.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12571bde641b56a1462d69db8fbc3f79f6ba1aaeaabdabfaaf8f8d3d9a90a092 +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/2.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/2.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d668c22224c478485caa174386e07989173ae69 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/2.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d4f49ae667186eda28c1aea9f20b55016c7287fd81b26a7380effa0e7b9b00 +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/2.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/2.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfe022895e93dbd3b7bad8b08a1ab4806a15e91e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/2.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b729935bbcc71155cf0c63fe4e99c2532d8798ef795eb5b628947af9a889c42 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/20.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/20.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..eef6334d6da8894702e55a2d3c2320047b171c1e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/20.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1e6ddbb7f0a25c6fb48112a19ac204abf62935f1e805efac4a89dea19feb24d +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/20.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/20.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9355e1fc61079d793b2e9f4d3e1346baf50ba97a --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/20.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5ff9b9a89b9a8966f57684c21d9006f505b379ff81da7a405c3e118643b0aaf +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/20.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/20.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f106ac77dbdd480ccbb372edfc737ec861afa047 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/20.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c627de7671cd6bd9bdfaba31200265d45dfb7032ee7120e0dfc2b3e3c473bdaf +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/20.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/20.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6101191cbed12b0bb82198aa09c302dba6804047 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/20.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ec3b062138e463f7830ab7e8ab0e38ecc83955eee1a04be5f2d2584eb54d45 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/20.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/20.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cf0e8c3b0e25278dde2550b6c4e33a3d1bc7a02 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/20.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1266f58c83bf685cb54d84a16409f5b6e825d63ec0b206bf9c0bcedcc8285a83 +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/20.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/20.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d5204e5dad7349aabb4919659ec3239b49ed00e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/20.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f06263d636003daafcfcfa23b67dce336d13c8c0eabaa4a7ca551af69605ed5c +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/20.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/20.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3780642ac73a344b00ba89fcf92f0891f35c969f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/20.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85274dd32069370511117e28ccf70f41585847073f075b40513a21e8b95bbe7 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/21.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/21.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5037a9217fdb57b189fcc9bdcce2325ea661baf --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/21.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:559451822aed987ddad296f124cf7e4d11147d5288abeeb8ecf3b2476f2ae0fd +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/21.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/21.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..63ed2e8912b4337217f11746594963e586752d2c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/21.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48e491e4f0c0c7d856b3fd49e18e0b652da71ef3417be9a0ae6da379cc659259 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/21.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/21.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..05981a3d81af28b6c244b9210f7725331499945a --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/21.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:228d8ad09bb714dec2319fe1a2c280f2fcebe84537499f672aff2ec42c7d155b +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/21.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/21.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0b510585ae51d8380a86b910dc67cd9979dc4cc --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/21.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584327f73f6f88def0280d30e216767b04b0f58ebb993476a1f907ab5a17f72b +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/21.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/21.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..04a30ec1bdcea8c58fb6f98140c5dce46b48c689 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/21.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1592900fe03b2f72441f4fefdf0fa8109cd09dd867bc78429cfb671e2e7c59b7 +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/21.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/21.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6878ff3c650aa908594366b080583efdbb15856b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/21.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78678b576e3af220019ce1faf8562b7260a15c231546876c91744732c022731 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/21.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/21.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a63b3eebafea8ee92f454363ad250a9cb51033d --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/21.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051ae2211e70105074f13874539d74916d1b7e2015fa294826356ff38e70711f +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/22.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/22.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6defe3a0a9a7fe342d19ef15f7a9748b0dddb21 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/22.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef9e67e703239dc5a90ede6b3b357624f281995991251a34e6d6235af6b00db +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/22.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/22.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bd946b8311600568ba0705d2bb62dadfa00f1b2 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/22.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91519cb9f605d41ddb8eb0d209c00ee7a538cbd5531b861eb5fbab4b09fa87f +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/22.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/22.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a6e86e1a2f97c2f212767b964a8180cf25bde7e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/22.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b225b49da4e87b970c7dc4112389ce56edeb81f728f7ed1b0343cfa337337832 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/22.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/22.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a14e03148ceeb2f4441ea112deff70b6fd3966f5 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/22.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46db9f2f042b0783a121b1c57dbcab12c313b4fcfb3c7300c9a79bf983c957d8 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/22.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/22.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..436688c3bc1e182303d31353e5c7a591854aa967 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/22.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73b91da173e001d319708d49d793cbbe5fb70269bee3c0c395eac3da0b9c5455 +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/22.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/22.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf9d7cc7ef449ea4d3502fd2b5ebed856fedca54 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/22.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d140c580994c1b56f75b0a4d1c392bd7c7e7e14448d2b0ff92ea59e94516498 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/22.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/22.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..38eec783a8972e4426d0ac9040c1da77b7ccfcf4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/22.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87902d448ef4bc6f23087bf2d2853cd36a489682aab6a2d3751fbb45557f1833 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/23.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/23.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c1e93cf67d134cd2a39d2045874a93e9b2369c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/23.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82221555d521973e253066eafa6c3d360fca01d54e1611650f80803ddb657c86 +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/23.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/23.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5826a5a036cd81a8bc6fd558f76d3f7ef914984 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/23.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5266c6879fea3fcc81b77df29a9aadefd06a755dc3ab8c2eb4bb272ec0c5366b +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/23.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/23.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c6e7a5703aff454081efef1688b3ddc50861bf2 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/23.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400a5f6248db21762e00fdb6158e9487411828398b04b825db10c3d7093d9e08 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/23.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/23.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..55c29e3078cea949db4238d04a1a2b6f8299c8c8 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/23.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bb657c422356e75fef3446505f0d1b8967c002c6f9b2ab76c2800eb074d7bd8 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/23.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/23.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab95185458f5ba81e9e6580a8999d1509d907cd --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/23.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b138d306fd4612343dd9b3601441dc3950ea690d002d71c2ea8d4f3a1ab7e98f +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/23.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/23.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..848268a89517600f2d8968ec9b6261b0263de23a --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/23.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:747a9005371a0a43a943e55b703eb6ed20db2755ee7150ef94bfcff597be1c6a +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/23.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/23.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b12a4b08906c3be5df349c76b4cee1b39912e7e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/23.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c5402d6ade26abecc42b29701e0c00d804c18e83d32c598111e871c23b30ae +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/24.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/24.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce86568156b6e461330f4bf0f30b3b09eec16bce --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/24.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7670642da9f976df7778673e9bb60d93f42fc5b32160e031ab537930263ae89 +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/24.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/24.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1c457c5fdd6818c630ab94ca0615af7f4b14d9c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/24.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d5c7b0ae0d5c8ec1bde75cfe263abfce26a027ac72542ce6e7ca3db0bd1b864 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/24.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/24.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..550416d88e0709a50baeaf5291847425adc74ba6 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/24.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e21dd772179520bef95fe7a7dfe2cb84cf837a89ba6cc0420503f739ee3a8c4f +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/24.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/24.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0bddf560360fc0daeaca7004aa4e75a3f63bd7f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/24.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98aba6edaf71a2ef0c614c3384daf361252272c0719981bac611a644f295d02d +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/24.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/24.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dcb6158c1162ad0293520ad76b4374a76033bfb --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/24.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:667a14d459c9249b42a7e6da7f298e26d8fd64713b0f321dd31f172b39479922 +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/24.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/24.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a158171f512a0992aba94e2038d63770a926056 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/24.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77f3fcfd958081f355d90a06147c7daf0fb740c8db979c210f6529be3d438b6b +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/24.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/24.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..84dce61a3a695eb09dc310110a295ab9288907cc --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/24.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a49d10e81adce4224c51e29bc296a73d01bc4d88b22c6131d25db6a7f8ae10 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/25.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/25.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b778ccc1dd3dae16ba1ee348294cdadc1ebdfe9 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/25.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f4aedf4f07ca8440c90fc49c5595b1d653373c75c4f674ff7e40e88a82b008c +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/25.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/25.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e665a615c24d935989edc3f11652385c2e662b0b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/25.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ad483bb4bb13bac36defd55b8a8d166af11815a3031dcab6715b9bc470ff6f +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/25.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/25.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd11effb4c36ca613c97642f5218f00f4335ea55 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/25.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c42bf28a1e225844ca61847177be4b5596cae2fcac5f9662cf82666d77cd2a +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/25.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/25.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ecb60f500af258fec61627dab089436d40d79a --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/25.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da59c3b19d9954bee49b0a4da18a4df09150a5f3394feb15f2254f22de6e0267 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/25.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/25.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce8fdf7060f32853afde4ebc284191f1769eef93 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/25.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf946ad9886136c95db5a43f6d8202bd889e2badd0f058b1f7081089a2a9d8f1 +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/25.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/25.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7246cd6cb90410de5e3f9e5919a5b2d515117aa --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/25.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ff47cce0b778b20daf84eb354588fd37a4f18cd724446864aff4c231a36b1d4 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/25.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/25.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..83716a9ec45323c68dd3ce6083144d6a2cf99166 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/25.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c50febefa845190eaf0bf634653bf8e3ed9adbdd82167aea03142df26c2cfef5 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/26.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/26.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..73e0bb773b84ae30b78b9aaceb25f0b0d7cc2a43 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/26.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0373d4f78dd2b9e445fc5354792a198cb122408c6599310a16cba0ffba2387c +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/26.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/26.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fd57173def9c10f3a2871706670130def981087 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/26.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d328c7056df6528280b15b3d3791d6884e26149e64fc1189683b9b236a6e88e6 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/26.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/26.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d481da37f7acae30de07b5ccfb20a73f74e4e93 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/26.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5523113148e3fb7d45091973ee8b1847563fb7df8396fc5192447c529c9f7287 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/26.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/26.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..49b1519cd75415c962e7cda528ab503e34745350 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/26.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b33cf936256f0ff7a7e2ca905acb8c58df860e18f1d6bc862277f4006c4215bd +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/26.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/26.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bdd3fb08db571c461c4f9cb948267252bb2bf24 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/26.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19b1be7035e55c6848fff6fc5ecf8fbd82921222f18022a6c86fcc272fdad90b +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/26.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/26.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..10dd6160c1c04eef16c93f02e26fe05398bdf5ab --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/26.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ead1950155c7e39927333b1095b8e5d5c83f12848ccb5d573dd4c69bc10b37f +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/26.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/26.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..39d74a5fa7f2780f11478fef8d509e78409b8ecf --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/26.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb47790e75612b6540fd03800567ba9d642a268875811a3139459ddb14b25c71 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/27.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/27.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..537fed3782b0a70be9564d6234888e4b3df340dd --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/27.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:912f88b82452f9b228c10fbbc78037fcb2298b019c4d4e7891e2e83573ad0969 +size 6486951 diff --git a/checkpoints/Qwen3-0.6B-Base/27.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/27.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..550aba24e2fd2f61bcd2b724088de7a50b320b9c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/27.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8509598b3923196310e0e049a09b019430a1fed0e436ec380279c750720d31f3 +size 6425511 diff --git a/checkpoints/Qwen3-0.6B-Base/27.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/27.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..990ab96bfe860aab521cafc5015958b7f0e31d71 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/27.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d17ce8172f21162e88c1953a52ee45ff54eb71465c3d97fb99855aa37dd34b5 +size 6425473 diff --git a/checkpoints/Qwen3-0.6B-Base/27.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/27.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..070d084d2606836785d6c00389c986edeb9dd88a --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/27.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d8254c06895f8c65163c261de65cd351032c7a33450d9dc933e63735b44338 +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/27.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/27.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e49e673545a4de4cc61d544a6cc56270d426980b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/27.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9868309383e0ed11680cbab559912be2d2d1c9515ad5ae81f32575d3b3e4ba9a +size 4326368 diff --git a/checkpoints/Qwen3-0.6B-Base/27.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/27.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbc17f81b627401693efe1d65d24dfb6fc3add19 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/27.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a1d7c4fa2a16c46dd218e7515a8149f138a084299e19223b1c8222635d70001 +size 4295648 diff --git a/checkpoints/Qwen3-0.6B-Base/27.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/27.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d8da82f1b3622410b4d10f507530096b3d57020 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/27.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d16e9b0760143d8179abd46cae28b9f4efa7d0b9a50879c7d7f76638eba9078b +size 2165728 diff --git a/checkpoints/Qwen3-0.6B-Base/3.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/3.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c294b2428f5da0b0c4755d9db27b41fb248a7ee4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/3.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4839c6804294d5d6ac20cbda0bcc0bc2f8f9fc8b5bb3a94093f7b36eac6cb30 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/3.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/3.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4d56351375ddddd0660ab8b86418eaaa164d29b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/3.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5fa12418e80392ffed46ac9dfda6fde8b9bddee8492894b10395444e1621bd3 +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/3.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/3.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f2bd05310bb004be262e09af0719c275c39d838 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/3.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6231a7985c15c8f56da2e79a231e3ed803003c4ff3721a610a2839a2d33437a6 +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/3.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/3.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1d565dd6e2e7a1ecce07265232eff61db7a6f2d --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/3.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c116412e8465a4ceddf350c3480fd5b97314de0c218e19a34aa0e2a7257d2633 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/3.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/3.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..022a82d053ae3183b5ea836587c54eedd5dff2f1 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/3.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61193d748a9ee96701f8928bb05d7c84e8d793f13e9f3a8c275bcc8d26e111ac +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/3.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/3.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a7fa4757011cb7a2aa55bb3b6ed8b1c9977762c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/3.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0674d88329af03ab4f27ca29541dad988ffacb2c5dc55e9fecb21fc16b9d5ccf +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/3.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/3.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..63c7b4f7f9ff9fc78960bb5fa3f64af9e16623a5 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/3.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ea42d71b72a767af2126eee8362faffa6093c6131384ccbc00998921d492ad +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/4.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/4.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd17f8c67e8fa3e90bcd28bba88809c969060cf1 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/4.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d14337a3c18effec79af64c4404bcd71083dc235636166e4686b91fb4df8c97 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/4.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/4.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9196b8ebb8e396197696cf1e6bd2b0005d77983a --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/4.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9abe92750d59fc83eb5f89e40c9ab9d7b28ada53b93417b90bc0818adbf53d +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/4.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/4.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2efd8a48785c2b3070cd1904c6b2ec50eb03816e --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/4.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cc06935e1d2eb7cbfaa1bffca83d36727fc86ffce0f85162c59feaaabaf5bef +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/4.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/4.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ea63dae65b2a80b9ac84d85304775a605db2a49 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/4.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4460fe3b5be62fcead14215d71f5739ea828cd1558afb4aec4886249368d307 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/4.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/4.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e13b53fc94b5f1724caa86f934b929bd186bcae --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/4.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9b6b4369ba0fb186e565766ace347b150d87cd76ff254e0522ad3b429175c51 +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/4.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/4.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8c9240cf3244280b3e7145dc0c4bdde303e3849 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/4.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7d021746ec6d89b8db327bd6d367d96eebe77b38817958489e7d809bec10ad3 +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/4.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/4.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0ef593bce1d7e743071e916486b0e3e786d07df --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/4.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1de17fce5de88d4786c2ab1a1098a0a9e188f32d9dcfe823118cf053b24e3a4 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/5.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/5.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b279f5607dceb11a47442d04ad221c4ea00c857 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/5.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7fc735b00ca349ad3d71e109a64b642c845bd6e58c3dce79972eb7119192c32 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/5.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/5.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b25e3d11f11f03c7ef8b12112b3f861c53a9c46 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/5.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5123ea5b5ed5bfebf477355136704c09985694857ca2d34d33c62088d98d268 +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/5.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/5.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..df1d5e34a9e8b128d0420473043c669e703eab2b --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/5.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ba7a7ffc5b771d13a708ee5759b3fee278ea37f447a9cd3b3a7960c51e0bea4 +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/5.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/5.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..efbbed9da788b9e212575a49f4e913d503440f16 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/5.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f35eca987706df2e6b27ebabd09907802688f4bcf867edbbe3f8c556e812a5c2 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/5.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/5.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdef536ba3c2e60cab0100d9518e7a54bff0f0b3 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/5.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8826d5c758ce65dd21c18d9e6de7228a6906bae2d1a64dc6d7ed556c570dd5 +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/5.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/5.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ad9693b8ab477425e8567f7ea12e5671e5221b4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/5.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b82d744181e7bf66cb188f7df737c8b6af1fce985239520d6b25146a159a532 +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/5.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/5.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..85cd338041777f8843f154f22e4e09c0108a8fa9 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/5.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90a5ecc91847212aa17354be090b8108863d6cecd6f407ddaf15ea33e97642ae +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/6.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/6.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d34f2676f71a7baec51fe4144188837a30d1436 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/6.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57cd7bf47b5cad832c7cfe0e3e56c34f499e0afda8c9f85112c6a9d448a1a158 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/6.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/6.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3476c3f047d4ff5cc945088405bdec46788bb7c2 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/6.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1e9a88c42428497dccdcbc0fbe34a9bd34b8870fed1682035d65d4828997bf +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/6.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/6.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3964a4085f50847e02ab8f35cac69d7d2b26d205 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/6.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8011a547fc4d963568f410f09eae5ddd691b2d06a750efd396fead72b5f31ebc +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/6.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/6.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28ca86d7c2333f8224aa885d9961233cb923809 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/6.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be862ec5c297754001f1e7597608b5016713c24a7d19d894228dec47cb71fe7 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/6.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/6.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd02edc6ec936e408f7717d97685fae409f244e4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/6.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c752363b2151508b7bc295834d066b3e83b914a85339b7c3dd3fa1583f7b56 +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/6.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/6.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..83c27f73ea1a8d5729d4756eba1c06c5764d9760 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/6.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977f284c06b14728df29ce9327cc72d2bc739efdf4d9d0353f245ea487827eb6 +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/6.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/6.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2deaf9933b7ab9c082cc47a978d285ce2d27c03f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/6.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d0dad2caa6af4a0605dbea794ac2ed00d0e3148fd1e5ca9b77d800e252a20d +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/7.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/7.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe884e64922496cec5b3c19cfc9b77ecdca634d0 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/7.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d47d5fb18c2b5cfb5cd4937bcb75a388235a05d29d90ba8365c1d716a4a72766 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/7.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/7.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc411387b9f8b28cf6b6f342da9bedf41538057f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/7.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a214a7dccd4b835034215fffdb73ada16f23b31e4c70fe8f4b430310ea01152c +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/7.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/7.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..019ca42fc0eeb6d0abcaa37f4ff08dcb6a15bfb4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/7.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d6eb24955d07d532d92c229da0994f6509db77acc53a67f7d3797defd88f49 +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/7.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/7.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9f18acd2ef899bcb8e4a1fd164d24198f5e2cea --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/7.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dfc49d70bc8acd9ac0aae237c258f96fc3ce4600f1f164e6b4dbacae46bb01b +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/7.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/7.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..eea2cd1dd2f077af6194da0240e85b7e78c6a4a2 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/7.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04444fe0478e8c47dd600a19195c38fec2363a787cacad8814e31e89f9e53600 +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/7.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/7.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a355d3bd3d93ed7a24a9b0a1fa3dc665c10a239f --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/7.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80f3212fec465b2f022874dd616f0c965a9704222187541c30072f6de1600879 +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/7.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/7.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0ba4a706141a6463796106c01e16dc8a4244800 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/7.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9708ffa25ce808c76db3b65b86c6e2234b56db83aed0f47adbeaaa6d2039b488 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/8.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/8.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb04217bbda404a1f2444877342b4f68be186007 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/8.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd69d18ad7f862b49f26daf62d1af220f00e445df554c6bbbbe1925ed3ed654 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/8.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/8.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..584b778912105adb64e2740028d80ae7f1981ec6 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/8.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18c8ead438cf5b11bb1f09bebdf51891c8cde6753950c5624e033318ebd3fd38 +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/8.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/8.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..76e443063eb00c299f1fcaa17c4be476ace6c7aa --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/8.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f6c6d956d2ff381832684a14465ed631a4be101c84ef43f89f7151b3de91b5 +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/8.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/8.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28eacb5eed2dc0d8d1b8cbe2fa7b38a39758f27 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/8.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89fd9f87f7149729c6217eedd067047d7ae6a985540fa4fc2d803b2fce562c66 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/8.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/8.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..75ed84a9b06bc07caad6674dbdeaa2e70b0023d6 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/8.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c03c6485788c3dcd59ed93d8c21589430b856c772b0981cd21b2af2b564cb9 +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/8.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/8.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0435fe44b64dabf04729da2832739c247aa6552 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/8.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a985bc7d3555135cc8b8dc994149092bd0bfa2e29e1cc46c581cac3c8d0b720 +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/8.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/8.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..94e9b8f1e8fc660018b3dbd0b5427c741d00c45d --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/8.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:440ffb3034be9ec2be3dc6930bb588368327673f244367c680832e60e63eb34d +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/9.mlp.down_proj.pt b/checkpoints/Qwen3-0.6B-Base/9.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..669ce0551f6216c3a99d794e7d6d726d752dbcaf --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/9.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c8d5f8c3c1413c76f4f215954b3237f6baa635f74665cb8514c3d47690e0d69 +size 6486932 diff --git a/checkpoints/Qwen3-0.6B-Base/9.mlp.gate_proj.pt b/checkpoints/Qwen3-0.6B-Base/9.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6f89b26cedc0cc7b1711355ddce9e96f82293cf --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/9.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65340ee1af785fb47d143b070a17f7a296c947594b83c4662f6fd32c6966bc28 +size 6425492 diff --git a/checkpoints/Qwen3-0.6B-Base/9.mlp.up_proj.pt b/checkpoints/Qwen3-0.6B-Base/9.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28d89678e16aaed1ad7e185ec03c1dcff821ffa --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/9.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2837232c56ec07c2717638399abe0c4595d535b1b5afdb75c5765d510bd4391a +size 6425454 diff --git a/checkpoints/Qwen3-0.6B-Base/9.self_attn.k_proj.pt b/checkpoints/Qwen3-0.6B-Base/9.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2924f1193cf4abaa86b7951e5e6f86a1ac1382a2 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/9.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b072899dd6509a024479f5bf6bc97220594033fcb11b10f1c198723d449af439 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/9.self_attn.o_proj.pt b/checkpoints/Qwen3-0.6B-Base/9.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..402f8e89cc364ec4d42815154b4f3f33a0df46d1 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/9.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef07980e67ee2e5ee2a8b5534053096e38cd5bff921a50715b90fe71b30d66f +size 4326349 diff --git a/checkpoints/Qwen3-0.6B-Base/9.self_attn.q_proj.pt b/checkpoints/Qwen3-0.6B-Base/9.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..76b66cac5eead534a041508007eced35b1301eb4 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/9.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15f286f9a1b3cc2917eadd2b696c41beb55c675d0e4e32b22dd8a9c574e6f58b +size 4295629 diff --git a/checkpoints/Qwen3-0.6B-Base/9.self_attn.v_proj.pt b/checkpoints/Qwen3-0.6B-Base/9.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..40ea1ccc7ab318de3f0392a2f640eb83410ac2f2 --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/9.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:736184635f01ac1b7d8d2e2cf20154c6898af70d730dbff8e3a25fe80c393250 +size 2165709 diff --git a/checkpoints/Qwen3-0.6B-Base/args.json b/checkpoints/Qwen3-0.6B-Base/args.json new file mode 100644 index 0000000000000000000000000000000000000000..94e75e53d68f291e0f597c72b126aa975661579c --- /dev/null +++ b/checkpoints/Qwen3-0.6B-Base/args.json @@ -0,0 +1,45 @@ +{ + "model": "Qwen/Qwen3-0.6B-Base", + "epochs_list": [ + 10, + 10 + ], + "early_stop": null, + "weight_decay": 0.01, + "betas": [ + 0.9, + 0.95 + ], + "eps": 1e-10, + "loss": "smooth_l1", + "q_group_size": 128, + "n_bit": 4, + "params_to_optimize": "channel_scales:0.05,angles:0.05;weight:1e-5,quantizer:1e-6", + "use_scheduler": "True;True", + "sched_freq": "step", + "datasets": [ + "wikitext2", + "c4", + "redpajama" + ], + "val_dataset": "pileval", + "train_size": 2048, + "validation_size": 64, + "batch_size": 16, + "seqlen": 2048, + "seed": 0, + "use_og_input": false, + "shards": 8, + "results_dir": null, + "resume": true, + "layers": "all", + "output_dir": "./output/random-pairs", + "init_rotation_params": true, + "num_rotations": 8, + "num_pairs_factor": 0.5, + "use_kernel": true, + "checkpointing": false, + "reverse_pairs": false, + "random_pairs": true, + "first_n_layers": null +} \ No newline at end of file