diff --git a/checkpoints/Qwen3-1.7B-Base/0.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/0.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e7b2621a9b7df35be503fe2911e79163fb5635 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/0.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d51cdbf0443ed53f4dd7387fe25265a2c83537445891fd48a2690462f52d7315 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/0.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/0.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ee3e8c0ab7eeb7cd000f39b192fed58dc0d6ecd --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/0.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f6ee6140fd81919231da5e41eafea9977130fbd029c07fc1fbbe734d78fbd4 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/0.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/0.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b22cd8829647f8beca12127af92d925d653c153 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/0.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a50ee76bb08ad4c57c74029e4d058a1031a9f9dd24a7f077093f1f578e4de2 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/0.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/0.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4d61d3d844b722ff5bbcf00b95eb3b5edc394d3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/0.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a549b3e8d1ed4d04d829ee1e5220b5d2f9b8e1e9d44f9f8c7ca78f3726aa38d5 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/0.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/0.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..83e9761427c3f74c6e80a91a1e03e1bc57fcb02a --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/0.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ba70038cbf2eba7d944a23b3c835a939c500f85131ae5f2dfef7cca45f77ee2 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/0.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/0.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f98eb423101351ed80a78a7d56815342fa10ba81 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/0.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b6a2aa1ed20562c227a3bc5a1d7b014a15dcfb9257eb144252f1c7e6b5266b +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/0.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/0.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..42f033e47cb94481bbe6786003121b5117759d32 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/0.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:933a7a2772ef2c9f540076bc4ad5dc92b4ce7c6a224baecd041a70ffcbaeca85 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/1.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/1.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7812b5ce987746db825dc634c11c8fc18e94ab2b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/1.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e23f2d0547f0562b4d48d41db3b4dbda955bc8393e23c6b2b9f8bc32a8d68bb +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/1.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/1.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ef954a981252f63fe93ead7c2e374f672a9d1ac --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/1.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d0e844382c3442e4e20af981b2dc442958fe0b7731a2bc1d78ee54bca57034 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/1.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/1.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd4a5edb7ba649a95a3d63cbfc402e0876f892e3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/1.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0909725ec36930f2906fbb035a4eeb97ad38907c72c2813ad074141834a7075a +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/1.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/1.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..399603300301274c47464503bbf508a6872a2478 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/1.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3569a558414654757367111ff47127c062e68561a6819c3f7efb5fda7fb3d5bb +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/1.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/1.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac1828e22b2b988d43bee803ad4c3cb0dfaa66fb --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/1.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df1eb0c7d7a4007e6a47658f70b572c6b22f44fe4d2707e4c12eba13cc0ff7b +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/1.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/1.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b256e20e31914a15630ad295962f8471ebb1ec4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/1.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38b852b860c070c5e2c0cee29cb48d22ede23b40ed0c9fba102387f584852b37 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/1.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/1.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f68bb67cb06073838526ea11a21da384dc9f4ce --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/1.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:107a5a434c246e60133a756e73c6b8ee4048596cc2bba7783a6d68c9e75d5331 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/10.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/10.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..418c5809ad7ae256fa08b679e0f8d8cb928b7ba3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/10.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4bcf3dc2f2489a8fb36c8cba9fa01c6c861e68df3c7ee29b430ecf82dec00c +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/10.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/10.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..066b8fb068fdd79cbe5892d61785713e51d85cf3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/10.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1af80b8db021ec1ee32bae97dfa1708d048f4367ff0084e5364c4a2116916eb5 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/10.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/10.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b89fa75c3bf1429cdc9967066ebf98501ff2f140 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/10.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c397f07bb0f554cf57a6d10f14969a8adc3cf948ae6fc0cfbd938ccb643cf14b +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/10.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/10.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a33c116b2c52d6471e4ad7c003a81684785b7716 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/10.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d92fa0b924c475c7ea1a9b296c939b47d0ae4baf2705b52431d532aa230975 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/10.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/10.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..001170589b6f8d85b7c0008040dd8d7cfc4347d7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/10.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef33fa51b4ddda1e7fd5ea2eb4c95660900692ade52711155d6fa12436ad8ae8 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/10.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/10.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7bea1a28008df3960e85e6ada1cdd7d9953681 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/10.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd59f01b8d8ffb674e89153a6701b3f136ad750b08fcee9eea20f7163e0e39f2 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/10.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/10.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..72633bd651d36229ed1b0e87fb1f035fab494914 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/10.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d43b2e086b8f4888df670d1e22c640232d36f761e5e4f2445b4fce39baf8708 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/11.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/11.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3956e8740bf67e9c5580419889fef5dc472556f7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/11.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d51142650466f1945c1733f32ce3bc426615fc2b5ca833bcf5b3ebbfc4497c +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/11.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/11.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..51b8b8080fe45b63a50c15e8307feea955ea27e7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/11.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64daaf9bfdc2f630749e0dcc48a0477b9c940611cf0b73f17abd8e7b5e697f4f +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/11.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/11.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8789b8a5a5937210c030c63caf9c619e5b0ad68a --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/11.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdab194f3576dc2e8bec1555ea22043adef5d90f655667856472c64ae6406152 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/11.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/11.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc3db7ea010e30f84d3bd452565b551085306701 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/11.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e6a1c8f089f6659f7153882c0f02f930690adc7b399b2bc8f2797545043fef +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/11.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/11.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7998cba3767a9125c35a8954e5b982053dcdc736 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/11.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b21a18a3370694ae8802cce070c9f862b6ddd8e48d5466347f9e14d0c9483d5 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/11.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/11.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ed013d0d90f8a81f5cd43666ad13f58a1dce57f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/11.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c438be510e8402f638bdf816914a0051eb100c6bff85c121d0fd78e781ec70bb +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/11.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/11.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a294f64468b455ec1b0dda28bf68227a3887b39f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/11.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9737c43cbb797ac99f2a405c2c97c07b317386ad2ddaebe7a2aa02f7f3b5114 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/12.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/12.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c0998a075f7a7310be717c7edfc5884e615626 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/12.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76cd6a1d776a52fb75e5185c4f76305c08908382892195c55cb0e7b47aa317f7 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/12.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/12.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..934e967074cbf0e73887c137a7fb3e9b73812791 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/12.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330110bbd2ca5a94eb54477e9c7a0758234c079e791e0ebb4fa26e410e843920 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/12.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/12.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b614bcbb946b9530e3756a4d85c536766bf493 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/12.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d9a3c93ef43d1be442dc821835b046c01fdd1922438f8da13ce058bcf44496 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/12.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/12.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a400e14be4b3466f24337dc52ae640bec7753f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/12.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97248f14a3deecce77fd82b8faf67d155602ad1d1a458016708565e35094f072 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/12.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/12.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..870dcbfc4cf0e8b543647fc4e741c077f833ca9d --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/12.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ec674b9a2a3895780053f3ab031d5aa7c6b83dc33b8d37701ec72ffab013311 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/12.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/12.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9345d4627fc84c407872c7e351107c69deeec43 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/12.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b8e2dd2cfded6b77d5ab1374344c9eb57b2f9a8979751c0d8f64eb897ed23b0 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/12.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/12.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..80041c36ccebc3cd82756d0defed8fd220246008 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/12.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af4b143a7e58dfd033891b52f4363d1505a7e801798f054d6287bbb402ec22f6 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/13.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/13.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b76ff62b35e025614179c9737a6fbdb3144df5c --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/13.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04817ce7e84d644615e25a02d3a03d1af4816dfe6d2619263ab71077b063a9b +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/13.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/13.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2598f99bd06f485aa06cb3be44e500aa08a2a4b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/13.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aaba5a474d8de3f3e34817be0673d67d96033a59339eac4ee011085d6269cc8 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/13.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/13.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2248226eb836e6a7deebaaddb6784df4962be28b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/13.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c29511e8b3d6eca01d18d3c2b59da3d7d04dbd37ef7ba50eb221aab1e053fed +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/13.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/13.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a655af7ac97fd733abad5bf8fd117e37fd0d4348 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/13.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc9c4d92244d80837ca483eba02bf234f3bd0ce2e733ebae3efa4de2af3149cb +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/13.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/13.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a96e59ac04c106861a06c3e047ddabddf737914 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/13.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893a54e443a8c4f4134aad7959fb02dab9ea2b1b9cf315d0478d1b093b1af485 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/13.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/13.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..caf90fee6f2cfd3fd9c5ff394310c23f6575f400 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/13.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c74d2f4c9d1cc11a52c55ddb915caba3501ce62aae1fbcd66858fe695f2444d +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/13.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/13.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d69f921ef88bc03bbdf127adb3f5818597e7a8ca --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/13.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3e0e291fed495422b91b12aaae2b1bb3c40456dd85542ef2260cd7009aaaf4 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/14.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/14.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..235294c7d8ae5db6d78e52124d82842115ca8067 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/14.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:834a3faf95d4539a4c5a8c56ccbc728ce80b3ee19a072363c9bca26e8e77bc16 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/14.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/14.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2934ff812ee5a1d827975c3015d96b1bf5f584c9 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/14.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e98f577c222f9a04addce3adea8c39784503f898fc63e76d95cb0bbcb68a52a +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/14.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/14.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d08d91f80acee7e0f38996f32dffc4d557dae798 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/14.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc0fc5f09d4b665e250f4e524e21bd374542a03985f1411483dfe4106735e370 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/14.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/14.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfa385a390ef4b193c5b307cfaaa225be8b34be6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/14.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920ec54e9ef4d063a7696384a33199a2231e523c3c126bb291e6a699d9b77ba0 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/14.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/14.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a28f18e819dc4f2865cb9faf0bfbb5879414c47 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/14.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf7b72891330aaa2b093e8d1439ca0ac7f382588491c3364deb074b152e087d +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/14.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/14.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..35cee06d40b4a47f7e4ed7d244fe185174cd9029 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/14.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea0676fc18bce4edd59f0d4ebc8720ea349465ad886bf85e449ee38d5779ede9 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/14.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/14.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc52e613f55782aafd7ee2993eba60a1dcc6838f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/14.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c569646cbe5420096dca010d659359a252c53e3c6c4178cadec3a9a066057565 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/15.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/15.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f34abcb6311cc490e98ce3e99ffa9c323cd7e22 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/15.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:447c69bc0c544d5f9c11e786c4e98e010bf56ff8949a8c6c41f97d02638d2d70 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/15.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/15.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..db871f4eda1a4719d6a54f15a262dcc755c424ad --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/15.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f7ef9c7e8bd13c0f7861c33e261d87bc0699798bc74615bcd35dd2dbffcfca +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/15.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/15.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..31e2a7e0a2d8b86880611a03480803fd158ca48b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/15.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45f2abd329c659b870e37d27f1f39cb81cecc641ce29f6d1c3ef1605d46c7cf6 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/15.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/15.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c41395692ad267c5171ce4b02fd785beefad642b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/15.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:248bbfce616ac2dc6571c7b121c6ed95f60a0749500eee17d3d866fc35a2a0ed +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/15.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/15.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..32add2e15cc885b3b7b699f4a9e3311dd4c1b8ab --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/15.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a14463245b03c61bf0991caf3fa2da5f0498777786d50ef84f05119e3ecd957 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/15.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/15.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6781d97298f5009806129f3722fb809d139931e0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/15.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fee06f6d5f556dac8fe9550a9ae96ad9ebe055e1875e9e09a49832acf79f8a5 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/15.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/15.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c76e76ef2298083eb69e61223473d26ac7cf27e --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/15.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a8943a379a7b49f02b999cd64514271f0f1c52179cc544742fd32809693c82 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/16.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/16.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7722762ec34d48bf5f15aa4b70009054fd47586c --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/16.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac4091743e38737c88b88358ff5fd60589dec4833e88e038df3dd11e1a9110e +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/16.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/16.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f23b814d8c2ce4941242a7e4e1e5125c4be3b325 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/16.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afda4cba0585f1dfccbe00ec1290f412c96599cf991c9c5d9b2d591bcb1e0ea5 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/16.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/16.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..85a65e5ea9380b1b5c960b25de775394e289c4ac --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/16.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac6406c7639c7e57c5fe5f4a22dfc7185cf45ec8869b85fb05047c54d9e22289 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/16.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/16.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecfcc1591aeaa5a0239ea9c8a39902b746d629a3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/16.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c9bf7f22561b9f5843451fad100b37e64d1b06279c56c56d860a216deceda2 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/16.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/16.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..51a770f4b8c147d276c8d51e9d8fb482259d784e --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/16.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85018ab533bec6d09cc37f403d2a3ecb1e77276a3f77f3f4de89b4dac17b0500 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/16.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/16.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e06bb948d4563b7d2e0d9fea42acca573c42216f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/16.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9871b730d3131f3e81f621e7a36b071ec13ea1e697cf679063ddc54ae24fcc8f +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/16.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/16.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ffed6cb2fac64141c3c73d71948981cea3bb24a --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/16.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a33d7dde0af90bf10ccd9ec76b0ec9ea38e0b188ec446d8a024ba13a6692e536 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/17.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/17.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..586595b2f08b8ab36c6c2b6349ab9a9f43d31b0c --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/17.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e43d0c92f7e50332596127978d2514b094e9e4969cc6ed576b8ce4bb43c2b52 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/17.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/17.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f43063c1053a3a8d49394d0c66313fc97574aea3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/17.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:274199b0bdcf05f992598e56da537a77ed401c7f0660016b6337e6e7b9bb27f2 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/17.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/17.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f997a714bb5a72abf01c9701793fcc071495a2c0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/17.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa995d0b07f45ae7fb6e9cf88c9e11bba47418ffc1fac4604367f0118616cca2 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/17.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/17.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc0ade84d8851446b806c71e360e3627ba71f7a6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/17.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e4e964756c33ce1e936174fed7aecb9d182077ba7f2035ae78e9a7e3040166 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/17.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/17.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c6aa73dae360b7cde09bf7dbb59da4ae0aaa969 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/17.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:779cad1f868759f043fcd70b195bd4f97767194d75c635d33598d0feda83f4d2 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/17.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/17.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d9e85ee8a0f1de90030f38fc74e1d619f726866 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/17.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2bd58332737fd2e169a46e9d2ef1ddc42d2f477754af4393e90d6a82e10a1fb +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/17.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/17.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..27aca5e7ec50752932cf8fbd7952cd31455adf34 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/17.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610da3c27629804b0205b1647feb1039c6f6ce3b103df44c1b918e398dfd83bd +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/18.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/18.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..398310966de4feb33645c1910afc595b902235f7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/18.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffd59a016d48dc66003793392535bc2c84a3e49a6e917683130db89b6a1ba0cb +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/18.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/18.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..31cb4d4cf7cb8362395432bea8faa004c04fe8bb --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/18.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d6b145bb7c72becfab9a88ad29f82841d3a86614bd3ccb996615467b5f55dc +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/18.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/18.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff15e6cd503094da90ce1b35714bdb4080072192 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/18.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904ebae1d508656c38c87328efdb6a27cd3a96c8c51e8bf00bc44b1959b381a4 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/18.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/18.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..53c3acee80c8e6911bac713a8acf9224946f688e --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/18.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2698db9a62fc12dccfe0241f8ad51e45506f213f5a7f77b98b87af8bacc23656 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/18.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/18.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd567d076fa4d0a7f059e0f1c6ad74621f2e5dd3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/18.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ebf723b61316b01b64a69e04962c58baed0afea4178380774a29ca9544064c +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/18.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/18.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6c865b4576263b35cbed79983015306af9cc96f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/18.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af0861bb8bdbd979112c3d1235ebfd80e48d09e96e2b10675b54d5ff60af44c +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/18.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/18.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb1da1376fd3df94d55e6bbde05263ee9845fbd3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/18.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:749a43398f24800c6f953021f93c83b86909f42ff5b0900cf1615e36fcd9bea2 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/19.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/19.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..74940ee4cdf32781826fa12c1db6b77a01176af8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/19.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64af3dfc7ff3a0aeb60b32613c7298b43ced072eae1875ee6259a254fc9d28dd +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/19.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/19.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2d70c614ad95325bdd96cc9053550537dd92508 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/19.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67c053d6602e2ec0b89bf0701e44f028418495ea9f16592a29a3e424e4907f34 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/19.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/19.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c02d18cca3652f6f0484822cdd4682d774102e26 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/19.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa630df0bf8824b683f2a5e92d6028062509dd0d9abf4142f9470af8e547d2a +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/19.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/19.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..09569586a8657b9e850060a5b32437952f490a75 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/19.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6154adc8afd04d757b72b6521b0685b464087aa81368e31c8d24ef31b39e4286 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/19.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/19.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..907a7a7da0eeb88d7639ae14cfc5c9d5846544d5 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/19.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b518ea34d4ef86c5f8b1791d76fae6f7f683fe876c95d72f2b43f4c6fcdad731 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/19.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/19.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4fe9e7705fcc6c36c7a8547c003b0e90ba2de79 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/19.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82aedb820ee500ef8ed2d0ca12bb44341fe2beed1b0131b6bc21379e972ee7cc +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/19.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/19.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..db848ad1d5a4447af165a57ae064b047b644733b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/19.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4388a90e34e2efb0b08a6c703a6aa02dd855ad43d9377758007c81ca8666c3b +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/2.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/2.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b855c246dcb61b7032b3ef692274780dd76ee7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/2.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57fc40aa8005533d07277fc410bf10de7c1d3b21736ce165ff7b01ef4fb8fca0 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/2.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/2.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb8c50dee88a7e1d792dd7987c7844b72dcccd9b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/2.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b92f0a146f2cc7d54a6019b23217ec31e834c6bf410059a242ce05cb5e220ee9 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/2.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/2.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0db94dd4df5981df75c7510f9c6eee4ce386eeca --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/2.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c3fa707ea596fc15de419806422c35cb155c04d1a378cbb59c9a03ccac2eee +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/2.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/2.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0e1bf3c25875097ec9947be98533a54557c4a5 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/2.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c8ded4bf74da2dd53ee630fa33f01de431f93c70c69134a6782bb7e59879332 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/2.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/2.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9da56dda4008b4b60e1d8ff5612e36f171b94092 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/2.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69527e0bbc605ae5cb29527685b8f68d9d5914440f7a0b2b61faad3d7d098e71 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/2.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/2.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df016e4bd64e7b06785882b4eb07280962bdbb0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/2.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67a7c4283aefd8ce9b7fb282e3c8b3e0a16a983ba5c02ba9a0ace05fc0420953 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/2.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/2.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c2b8bd62c4dd17076bee1de5b8bdc4c91102f1d --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/2.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6deda1443f54533a9acb44c16ad15eec0d2c763a21e2a2602ab2988aa24118b +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/20.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/20.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..be9ee2f839526103bffb14dcfcf3289d527f7a10 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/20.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde2f1983c790b003139cc8df66b1b643e716e2685927b05bbd42ada338a49ed +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/20.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/20.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c5b848916d21efe5c149d2ba86454c5156866b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/20.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea591526fdd48f445ddc76ccdb1253fbdc03d51ff4b84dac6c7c72ba93ee813 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/20.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/20.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f2d4ab75344fd1e9c9603167a2ebb146d488aa9 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/20.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61297d57c9e969e65be52cca3ca739d43470dd0686c1c023c8f30580f48bf14d +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/20.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/20.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4355aba1e6c35a26d9f48d902eaee288a7f1c72 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/20.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c805c28db5de09854bd62506f9a5267276143d7f342e804355368b2ced2b1edd +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/20.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/20.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a55a976942e48ff7e61e3a38e739e501f67e7265 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/20.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72dc47737ce1733cd8829a7cefcd0927fc163f363d2fdee2dc7848914dafa8b0 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/20.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/20.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2990edc07f2db12793fe46f7bdc41da1c7e3fc7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/20.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1fac5bdda49e150491591bdbfe4d9bcafb29279ca1ca307076e53b6253a178d +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/20.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/20.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd16eed322024fab8b7f7bc93329fa00a2b5f585 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/20.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f378dc08e674e10382bd8821ba497f3fad5cfa2e05b07c74d9d7f0fb3cf34ba2 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/21.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/21.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b32e802c319e23a52a46134c39f1fb2d05a0de60 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/21.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd3f1a4d8744548d39c0918c4dc8ad6b3ad96eca1c3529a0cbbea2440841f93 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/21.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/21.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e75ebb87b115400cac08af9dc2814e71979b004 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/21.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c77a89695c8db9fbc1ad33851c79de44e7111c91ba1394fc77c84f861d1a03 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/21.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/21.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2532a95965642e79e1998d1b9f0734ebe476be99 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/21.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24a0a6f3663aea47ea6031ff4b953f88ad962914289012911652465b93e5cdfa +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/21.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/21.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fcd351e6978f334aba109fed7c3d943f079b01a --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/21.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:759085cd496e3efbf83373abe79c06c9a6b2f6682431a491f12b22ffec8e7f76 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/21.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/21.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6c50e18a7a71ec4e36d1288c4639fb0dc8ff568 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/21.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f3be1bb8228b99bff43dc619374d5a7084239836fa5a9c11827a2f8bbae2937 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/21.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/21.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2803b7e274982c48a9a4b7dc18f3a40b4191f9de --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/21.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65439eac4801a9f517c3e6315e43cf1f3537bc59ef07229343bce6356d5f35a3 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/21.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/21.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5811816d1ec9bd64a416e58af3c82ea9098d45dc --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/21.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40e81d901ee79dd62834ba60c4fdb12612f92de08e0896687c393986e7d07dd0 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/22.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/22.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..033199095662b8c89234b3b8aff12b0ead6ba412 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/22.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fffc960baa1f61430fe8e184d713ec8503793d39794dca21dcdfdb2dd7d43f8c +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/22.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/22.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a389346d4b002c8c96d57d6bbe0c36cba5759173 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/22.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c18dd6bbdf390b725f652e43c6c795158a20608824c1e01a3121129f8adfd03 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/22.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/22.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..23e0fe5a3dc2ec9b0da7e394384143e2fb6e338f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/22.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47e85a9ca2ab0464b41e69fcdb0c3c3fbf4236f3886445b4ddfaa93bda8d756c +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/22.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/22.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8dd11c8ba38d49c614999fd6544d016665f4507 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/22.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22bd53047c4fca81f2ff0b91acc3ea6a3d1b30d64fda1bfd914b8aef1444b564 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/22.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/22.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5cef6e8e7151aa7d8e404251af08ee1b781fa1f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/22.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d9b9626fb6e9167c002608a7e2239b27c64ce510019f0a65b4ac3e0591034c +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/22.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/22.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2442279904fe5c2165f910c73a5acb54f0b73f33 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/22.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc52122becf90ce6478c773c17495781eeffc4028d33c1e200fcd23bd13b49c6 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/22.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/22.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3750dba12daa21c2a8d6384a62830ef0dff915e --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/22.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96bdbaf43e4b68cea3372be3f6dbf571371da66fb90017dfef4ca598bc1d8e81 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/23.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/23.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5679999a00f62f84dc066a8d2e2fd333cd422c4b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/23.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef55a12279de5fce68a1b4e22b7e96895289fb7621fb57ea5dfb8ef140ec6324 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/23.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/23.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a6d85e8d27994c6c9449580fe70432e6b1edd2c --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/23.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6c34c8dbf04ef664021f50ef7e0f640dbc53d7c717997abd7c90effbac89b3 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/23.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/23.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..47ce6da08dbc51de2823e56a3494525fbb364482 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/23.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f3fe596e0eaa6db253e4efc77ea6e2a5937c571c033366c478c86b2347e30d +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/23.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/23.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a646db8a637ba7e52145b818e41b495fc426449 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/23.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff3f8d5a6bc827765a6018477a7fdd1e8a35f0f696876a9551be963d8c427cd +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/23.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/23.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..89ab6529cde7841d70f8ebe71e13745ecf8fe4a0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/23.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6237c036e071719b5274d6dabb78e9a5d01b48b60c93f12dd454f237b3930d79 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/23.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/23.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3805c657991287352a7ffd834208a9ec4d345c7e --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/23.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69bc2bf2effca3c846de94f49d2c08800d4bf02a4a9faf30e98dce7684540988 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/23.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/23.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b51b5695925d9cc0992ecb5c6e8f3df7d4866d1 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/23.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b780476c223ab894ed5caa6e1750a0f807084f175d70f9281bfd1862a3bfd257 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/24.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/24.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc0d3b13e0f14a00379ad3779a258f25a1417c20 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/24.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e01e8191f15214beae7ead1dd872a20c1ffb47d261e9986cf9386053a8d5ac25 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/24.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/24.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..56f61405adf9fe9a388e2eb4744c652db534b177 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/24.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26d27f11ea4b5dcd984d4d321f3789b4c746bba5e20085ca4ba7f6c57ae95940 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/24.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/24.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..54d9a97ff366fc0a5d37cdec3aae73941f02f34c --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/24.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175c1e5c3044deef174dc0fdd9fa3b06d668fbe22a8368d678b42d75b421012c +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/24.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/24.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..936fe2b945da5f180ca8f17a04b7da094644f505 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/24.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2c114295d06e2a22d0678a111257aeb265cbb719966e08e74cfa47cc995165 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/24.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/24.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..884c793c7e246ecebaf9c8a29117f43c3b9cb6c8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/24.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b3fa94bc46e04cf7e9428e3b6ef96b3817250a949af44d5b60c79fa24d67c2 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/24.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/24.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28fe4dc1d6b6277188bf0f7b682b0e66c9111d4 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/24.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07c1ededf3980e6bc7d577149a11e152b35429b04a14b2f9a7f7f9a99a14f66 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/24.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/24.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f3612c3b88c679f313532099ad1947ba25b85d2 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/24.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1abb83e57dc0dcd4bef2222911f325498d674421668b4078efcc37eb5585dd1 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/25.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/25.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..58d56f4358227b0276bfe77d0847414b7ff8e7d3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/25.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9120768ee5a466239416f80c65b9610be53dcb325588c7eaa20447605b0a7c4b +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/25.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/25.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..234fdc1f10b8240e0f4bd9316c8721223a58a67d --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/25.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6741316148cc630c1d9a6e675539f0059afab825f8ce837dd821abe0f7ff72 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/25.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/25.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..779aa13b1817e3ee1f70b8ecc5e13fe456fb68b6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/25.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f96fbc05a18cc0d14c04d2d99cdb0eb838865b02145dae6167705c65c6fb2d +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/25.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/25.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..07182d7669ad236217b48e5ac01a773e3b6a11e6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/25.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa1fbff90f8bc337b93bd52a034e13ad86924e82fe61e305f9f6527ea20c9956 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/25.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/25.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..23daac9f62cdb2a73dd641f6aa6dbea20194294d --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/25.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c5a0c36bc565fa038df8fc267918e72282c72569b55006289a2c1de17b3102 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/25.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/25.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..abd2a1958230f2aa0507e73ebbde89a8f02c47f0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/25.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ead4d9fcb644cd74ab6bf17526508efb60e786eb958c4f19c5eb101215afeb +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/25.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/25.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..40536d78c3660b450df57bc46be55f5858503837 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/25.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:277601c29e4f0ba92a938252eb3e65a10c9fcbb2aa977c9bf2e4e8521b6ae03d +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/26.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/26.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf09ff7faf011aba32c3368eeae22ff7ed243d35 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/26.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:002b812d9ef74749f24b26ccd9c4bdeced8bebc993a0b95ddf021421ce74ade0 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/26.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/26.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aec03998765ce644b8c1ec06e5adb8f63a16f66 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/26.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a20ba24cd05eeae8c989984500ace8a9e41f0744a5abc000266602513609e4c +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/26.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/26.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ebf307c450f8cd7214a3da1b65c50c7d593a1a9 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/26.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eac0d6e77efd74df9078ec08612f805f185d009d51886d05570d5ca1bafbedc +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/26.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/26.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..36706211d648fe215d9b875e890480c52d7195d3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/26.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfa2fdfd5e97777dddd4bb14ea30cd9fe71ccc5472c163da2ca664b8b16be676 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/26.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/26.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..78255ad0ac290bf153133c082f02468b86d5c575 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/26.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f22fa0a80ec532399a13d10d1b0e61a724bbd11835a5a3754f71cdef87629e0 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/26.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/26.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..114e9a7f3c0bcc5e352b0c378d4ec1007c18f736 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/26.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c70185d0befde6660cdbcfa69c6448961ffd0f1452e7dd3c51ab5be8a61e4057 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/26.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/26.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd67dbc77a2b01e2a2abb4e5a5ea8b16c1d5cf8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/26.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16b8b8d2d3dec3031f3fe2b66574114364c87ee1dfa35731a5c8694eeecd58c +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/27.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/27.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9d1744aa2dcdfcfa9dc85c6126de208b79c6d95 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/27.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8979804daf643fab2827c1171360a433f5562c16bf4a1634f85a696e807dbf17 +size 25748391 diff --git a/checkpoints/Qwen3-1.7B-Base/27.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/27.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8efa82bcd769de6a5395a6c18f8b2083d134325 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/27.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61737ea06d32444b20a8ad248a211806de36e26260eba81e7d66c2d7787c2c8 +size 25625511 diff --git a/checkpoints/Qwen3-1.7B-Base/27.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/27.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15b9dd5f95619d9ed874f44c66cd17b8bc50928 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/27.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ff078c779a70fac4395e3e86183878aa5b3234ff93331744f0360e8f8615028 +size 25625473 diff --git a/checkpoints/Qwen3-1.7B-Base/27.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/27.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b03055118404f7ae9fc43a2a1e60d27fb652b7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/27.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:808bd840f222ffb1a37142dcd817b9c7d194d92d1e9e81c5391c42e2908bae1a +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/27.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/27.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..87f4491fd6074ff9abd9f9daf6fc213090dd0856 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/27.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c416f1a703693b2beb325ee65e971ff39d1b75e29a15881333ad78253411b46b +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/27.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/27.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd453beedc48fcc89eac7750942bc977f83f38c8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/27.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5223dbbb1f395d4baddfedfaefdc5feb4aee51f8b5dfd8f9a4fccabf7c787480 +size 8586208 diff --git a/checkpoints/Qwen3-1.7B-Base/27.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/27.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..13cbff6b486e55b4556364642f691f12ec75af33 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/27.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702f93569fc42394235ecc1de2b337dabd819ca34415bc9ffeb5942047d7d159 +size 4326368 diff --git a/checkpoints/Qwen3-1.7B-Base/3.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/3.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..567571cbd039e193007ec641e956767c8e2a7dd8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/3.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:471059277edc0ed6df8dec4e0fbc415bf39e99627d16b580a08ffcd1009a8fd1 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/3.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/3.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8438bed414de7826ed33a4b02c405a1aab5b8f0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/3.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0081370bc616ece4c44a58b3aa63f403e2de37e0746838613257063547a62b2a +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/3.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/3.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c18427906fe2720a1d39983be212d70102c6e80 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/3.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3550a27642b606fd45e3cfd5a2dc9ca2692ffd6c612628b8011540f73dd75370 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/3.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/3.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bae9a9388f04aa4220cd688a450a6c0047335564 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/3.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f9b0740aac8da736c76e03b4cf33ee195ec19b6635bca96dfb9ecf7d606260 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/3.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/3.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5f0ba85335ee60662eb382b1551415919236d0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/3.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6adcf56dd31d7be1e4793e1480e1f672458261acbe5866129823b2bc3b1d4a0 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/3.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/3.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ee97c29b6a49e28ddf29af3e50a1a24418821f0 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/3.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81c5bcb3be814dfa1b713eb4dc5910df4d0444d5126e6ff7af95324bbe25d8c +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/3.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/3.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..328c04b954fc8ae75b5db83eda5014e2b12fbc16 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/3.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd3846e30d55409dd640543329a15121605a2a200a48c9e4e9fbdb3786bea837 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/4.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/4.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb0e3d4515cd91ab9e2bb4fa31891aca457f746 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/4.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd147a03825166064c525efc9e20389e8f4c4c8ce4ddf7fa2b662595d87fdbc9 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/4.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/4.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d40548de3dcbb9f4c520e2ac5ba8ee850ad188b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/4.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cddeb68903159e65390dfc646d7f25e2e640f714d084f920870b290c64688aa +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/4.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/4.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..92d6a6fe4cfa96391a46da174ba0de323749ae1e --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/4.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:270066827ee3221e9fa30c8e24b0ed2a8ee2a239f69f3e23eaab1a4df1edc989 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/4.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/4.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6508bc22b84c29822852daa0e8f5ca19247ef63b --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/4.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dca798c9e0727b57f278ce848a329ff70c940870e35da17b94cd8d6d5c47b53 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/4.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/4.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..63d741efffbdd329638fbce29b018e4c64a0f711 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/4.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee2b916ce8c242902763751da07f111a187cf413a041b863228e65e22145b5c +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/4.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/4.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d6e58921cf453707e02f124c9f905667cde1b8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/4.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:932b974e53d14503ca7dca7be4485fdb49b1ee6897117f44a5c849321f3bc678 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/4.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/4.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e295498cff5d0148dcc6c746ccbf3b95d93e22a --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/4.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb175c3a9aa9b408b1c551ced44c54d42f9f08055d2a9383a63ded86cca23207 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/5.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/5.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd3c8d9c6e40aacf2f39f0af72f31ad3fdaf9e2c --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/5.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cde2226cb98f054901d1275566d0407696b639285211b07e828c71b47018805 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/5.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/5.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..341c9f5a0cd5e41e57368d4e97ed77202567e08c --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/5.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa70ef3658fda381ff42ccfbb2b097bb9665689f3a3495217635ec96919604b3 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/5.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/5.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..56fc6220201e14500dfa883bd46a3bd6b8c8a504 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/5.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f23ee26d35458cc20201cb5fa8a54cb3ab39e5b63fc0d54fdd44af648d93452 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/5.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/5.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..e19e083b4216e58f0ee30186fdf1d0d5830ee979 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/5.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6707b94bad1f4123c018f46c6932497dc05abee11f020df4c3848a0c92814e34 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/5.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/5.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca69163de1efb410c233fb8241386176858bf281 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/5.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87a71f80b5d98780621ae2e70addd9b4bae69c580de25dddbc8850c3e3821f10 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/5.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/5.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b651fe5d8cda14ef551f8959860081882396819c --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/5.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fd6a7f01be724cc5ab46a7ac87050e2b510c76534ed4957fda51fcb9c678b5 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/5.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/5.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ad2b8cad74de65ecdb3031d70d0bbb5e419804a --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/5.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccca3474f782f49ba4874f89bf84e42c85bd20071d0b01ddeeee25cbf00828d +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/6.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/6.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c6a3ca6f4c0c886ca66a4d4c42e3354d921efb6 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/6.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:009cf6fd151923a561b19ad3d4126aa17a35465f202ec2bda6e7797802afbb6e +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/6.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/6.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..b895e6124498ac010bf6afe60b1e41834f92b420 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/6.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f8d723b958a7c95a4dd635df8c9d32097f3e3de72dc50fd292919e09b06462 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/6.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/6.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b35d6cb8ef11d9e316ac0784e32416f9425d7dd --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/6.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f04e8c9e1792e4db41b191db8d87d31430ba49f18a2d31a0d26e16941b259bc +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/6.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/6.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..de444a97063fe87a098dcc74e48399824df07cb3 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/6.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4de5595a099572bbaac927a5a9e3087fbf569a999fe6d62db5c268b72d4a55d +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/6.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/6.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5af6d0b0627ff669110e24b06b3f89cf9d53b7 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/6.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d473747d40504154c5e85da7d1cf9a74dfd14e04ce3bc72a82f2ee7a33187c3 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/6.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/6.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf0cafeef5251c64e88f8e1a6660e785c1573d4e --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/6.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b0356c622b42a48d089b980b8fca7a9b65545d59ae824209652acbeb48fe9d +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/6.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/6.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa193e9e246b71948a3b36d04bf18e80fe9ba605 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/6.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0ce7755fbff1e38f64c25290f3ffde831ee41968c25091711b2744f8c5611da +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/7.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/7.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1479f5d618bbf1bf30cf87e15cc52a4eacd3bcb --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/7.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071418aef8a0a1465976d8c0e7dfbb67ac4093f104329d2c275d5027b3544c6e +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/7.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/7.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4472be7c04210c1914dad3afe55aa3f415ff93 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/7.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae729ebc2a263fa912c13ea2a20aad43e1a36d01b96208e7f11dd66d3b9ec5e2 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/7.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/7.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a73e2b22af34faa198ccf92e6e8c3eadd5720bc --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/7.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f388aa441a7dfda0e44eb119a86742eb1bc565f19adb075d24f92aca0587fcbe +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/7.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/7.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..73f141b738d7272b9edae74f4a0c8ce041ba50a8 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/7.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8825fd0a36fbefa0778fb028bb099cf8506104a8cee9bd15c6ab4180921f9d14 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/7.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/7.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d3a846a6dc48e7605bb303a16c63a07eb360f7e --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/7.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653b9a9577097cd9ed28ec589502341014ce0800f4dcf220bb7b2ebdba361879 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/7.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/7.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..16fe2804cc0c64b962b9950df9962c6b028c2213 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/7.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d265663b8ab0c39ce17cd84bb4ffbb9397f3e28303b7d134a09e5ed892b24020 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/7.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/7.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2897bb9d9a9b00e4f93dd899fee02b8ba3a2148 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/7.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddfb6829f7fabd18c1efeb067422a434eaf47d5bb42765e2ad8a049ad15e9225 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/8.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/8.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..595acbad55e11c6a689d545062422cb1e02eb266 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/8.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cdb3224f5952d62e630f4cd99a30524c4da2876449b25177efa109dd1252d52 +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/8.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/8.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..dff1610f65b2333827c013a26c8f66cc1b6d6109 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/8.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a558c62675cbaed4f2e8fe65c7cb21de68a5b3a5f207752495c7cf5375b156 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/8.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/8.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a37b3ed42fe8525ccfabeef9d430c41c8757f5d2 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/8.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19578b9ced95107d1fb29b9690035ed5122f0541e6ef7fad04ed95eaf4fdda4b +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/8.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/8.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..c15e2fec63e0dfe84aa5ddf798ef18899909e917 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/8.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed8c32899a0ca0faed53607f4856bcbe19923e5283bb69d0d8655f4551b88b6e +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/8.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/8.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b0d9bf4623bda3f2390d322776d6482f22c89b9 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/8.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbbd836735be29775c6486e5b566dbd6ff1493981c9451199639287300e6a3db +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/8.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/8.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca81b2101e514afc6ffdc39d6c617aa300d6449f --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/8.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27db10669c22b9c6e01d89073fb06a6413d6d313ae430fe86edc0154abf44e68 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/8.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/8.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa2d89bee45797387578a667346b480eddbd89b9 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/8.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4288f23ee0480e5cafdef70c6a7517b8e71b124e65dbaf05661ec87cfb190ed +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/9.mlp.down_proj.pt b/checkpoints/Qwen3-1.7B-Base/9.mlp.down_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..16860b297f8c7228e6d999ed931f6adaf330f127 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/9.mlp.down_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d9b17126a59b8b4477be3124fb177f6512887345fa8108296d160a0763c730d +size 25748372 diff --git a/checkpoints/Qwen3-1.7B-Base/9.mlp.gate_proj.pt b/checkpoints/Qwen3-1.7B-Base/9.mlp.gate_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..38ecf3dd07e10fe77b4f63c734b2842ed1bfbc92 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/9.mlp.gate_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1979e770193b78867f7bee69a8cd3c3645e250af00486b51b6727705c6a86bc7 +size 25625492 diff --git a/checkpoints/Qwen3-1.7B-Base/9.mlp.up_proj.pt b/checkpoints/Qwen3-1.7B-Base/9.mlp.up_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6c0a4fe7d34099ebbcf1908b5ceec0f3f62b1ea --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/9.mlp.up_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e1c246fc54d73a6d091e372c4fa391d981e703aedda06ee08771129a1493cc7 +size 25625454 diff --git a/checkpoints/Qwen3-1.7B-Base/9.self_attn.k_proj.pt b/checkpoints/Qwen3-1.7B-Base/9.self_attn.k_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ea760aef8152ac7db420e0e09cd52b061fe824a --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/9.self_attn.k_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f45a8de14387642672c271940a82f751ff8ef1988f8ebc21d1b94268f2929a8 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/9.self_attn.o_proj.pt b/checkpoints/Qwen3-1.7B-Base/9.self_attn.o_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..cebf0afb60b1d7dcf84cc1c00e1a501dc9b471b2 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/9.self_attn.o_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:652a11d738ac6dd52ddc1e6a018e080565c6faa40c2eb5fc39d7935fe0cf2c27 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/9.self_attn.q_proj.pt b/checkpoints/Qwen3-1.7B-Base/9.self_attn.q_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..a21f5257573c7b7c77c636b9b9008687f6e71c18 --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/9.self_attn.q_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b00f175b0e285e457642c5348eb1c09d7d7d0505ebed069655d4d63915d8fd2 +size 8586189 diff --git a/checkpoints/Qwen3-1.7B-Base/9.self_attn.v_proj.pt b/checkpoints/Qwen3-1.7B-Base/9.self_attn.v_proj.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcbcdb33cebfdbeef84ddd037581485d62ef14ac --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/9.self_attn.v_proj.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a810f24302e470b82b8ddf65f78d6d5db266ffced44171e766076de3352fe693 +size 4326349 diff --git a/checkpoints/Qwen3-1.7B-Base/args.json b/checkpoints/Qwen3-1.7B-Base/args.json new file mode 100644 index 0000000000000000000000000000000000000000..7aa3d548174b21cbdf9d0f5654d3cec69b467fce --- /dev/null +++ b/checkpoints/Qwen3-1.7B-Base/args.json @@ -0,0 +1,45 @@ +{ + "model": "Qwen/Qwen3-1.7B-Base", + "epochs_list": [ + 10, + 10 + ], + "early_stop": null, + "weight_decay": 0.01, + "betas": [ + 0.9, + 0.95 + ], + "eps": 1e-10, + "loss": "smooth_l1", + "q_group_size": 128, + "n_bit": 4, + "params_to_optimize": "channel_scales:0.05,angles:0.05;weight:1e-5,quantizer:1e-6", + "use_scheduler": "True;True", + "sched_freq": "step", + "datasets": [ + "wikitext2", + "c4", + "redpajama" + ], + "val_dataset": "pileval", + "train_size": 2048, + "validation_size": 64, + "batch_size": 16, + "seqlen": 2048, + "seed": 0, + "use_og_input": false, + "shards": 1, + "results_dir": null, + "resume": true, + "layers": "all", + "output_dir": "./output/random-pairs", + "init_rotation_params": true, + "num_rotations": 8, + "num_pairs_factor": 0.5, + "use_kernel": true, + "checkpointing": false, + "reverse_pairs": false, + "random_pairs": true, + "first_n_layers": null +} \ No newline at end of file