diff --git a/3b_layer0_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer0_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..17040a572bc23898fb6e2312333c475283dc58f8 --- /dev/null +++ b/3b_layer0_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b66d4e59002bcdb5c16bbc84a3cfaa1091841592b3f9f028fb352206f2b57c +size 92585543 diff --git a/3b_layer0_mlp.up_proj_output_reasoning_representation.pth b/3b_layer0_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0ff59202dc3e68d6116b8dcf9290300c1c1a2ce5 --- /dev/null +++ b/3b_layer0_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cde8f43ed84db370ed797469b91bd9475dda49bab80ef85444ee2e74e070020 +size 246892034 diff --git a/3b_layer0_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer0_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..880565df514d99620a7689b1068062bd47ed75c1 --- /dev/null +++ b/3b_layer0_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:551c286f0145a650ff7287a5f7aea4eeed631b9d2bf4e1efcedbc15dea6e3fc3 +size 92585558 diff --git a/3b_layer0_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer0_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..490ebbd55876ed2538b0db663ac7961e8b2d8d6a --- /dev/null +++ b/3b_layer0_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01854c3bbbea741055ae31e858cbef92f1239bd74d8c2d07c75d800f7cf2d912 +size 92585563 diff --git a/3b_layer0_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer0_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ddb5830f0a4b9d3bbc619e6ed781883bc2862c6b --- /dev/null +++ b/3b_layer0_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9382b92823afa844b42cca74a45d05be52ff236dfb3964ef0f4af89304e32b18 +size 92585558 diff --git a/3b_layer10_mlp.down_proj_input_reasoning_representation.pth b/3b_layer10_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0ad3f2fb6f7d3b57f7b6b96343c9ddcbd911ac3 --- /dev/null +++ b/3b_layer10_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:356a690d2b181307bdf8a0d57f4e9e09622a5fd285434ffba857e8c57d39752e +size 246892108 diff --git a/3b_layer10_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer10_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f625cf83bb25d4d0013f9cf7169960641cb0fdf6 --- /dev/null +++ b/3b_layer10_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c767890754b732970ff2b77e14860eeeeeed3ba101c883fe9b773924ebcb5b43 +size 92585548 diff --git a/3b_layer10_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer10_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d0bd2bf0e92197f06ae79d58b9e5d79ea993e6f0 --- /dev/null +++ b/3b_layer10_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00e9d2cf3550749b62a806cfef9482bf7022eb9460a77046cb568327b055a9f8 +size 246892113 diff --git a/3b_layer10_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer10_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c539b5754a08aca16935be45f190916bf7b892f2 --- /dev/null +++ b/3b_layer10_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce995c1f5ec5ff3bf2e28bdad9f179d5091677bba41568bd55545c3b78198a6e +size 92585563 diff --git a/3b_layer10_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer10_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..dc2ba2504e6b2bc9fbb26f0b64923d8a27f71b76 --- /dev/null +++ b/3b_layer10_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36589b381c5b96eef1891f029537df304ff71ccb6a475f1ed450ac9d6b31e2f7 +size 92585563 diff --git a/3b_layer10_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer10_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..716e3a8386c1f2be2358a74390035b3f2c36b14f --- /dev/null +++ b/3b_layer10_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0578c202f0ee89fb7b9567ed80a8004e5bc1b7f80a390f2637ca7730da1786d6 +size 92585568 diff --git a/3b_layer10_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer10_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..187bb14ab7e3446303b24752fcd5fc323b7fe9d7 --- /dev/null +++ b/3b_layer10_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be0b73c378d3f4f04eac190b13a2a4cb71f95571c55d1702d03566f1e62bde70 +size 92585563 diff --git a/3b_layer10_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer10_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f14cf28c01c6d75769c697ede86ec594f7a3022f --- /dev/null +++ b/3b_layer10_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa43aeab9e0c5b5f9f35be56f21feae2c9127914f9c9a670c7f8aa34c116e625 +size 30862944 diff --git a/3b_layer11_mlp.down_proj_input_reasoning_representation.pth b/3b_layer11_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..db4f6cb7309d114fa6545f2ff29012eaa6fd4d36 --- /dev/null +++ b/3b_layer11_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa09f50ec193e72f1becee5cb1b937fc02d4b1c046f31592a77d867e116c2e4e +size 246892108 diff --git a/3b_layer11_mlp.down_proj_output_reasoning_representation.pth b/3b_layer11_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa87f92a3ce3452e116f438304d83fc34e74a563 --- /dev/null +++ b/3b_layer11_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cd077207fb8b8b8e3d33aba6cf1597ae8d3f41f810a0a5d7f7de2ed2b1ee60 +size 92585553 diff --git a/3b_layer11_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer11_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a78412a3d647b5ce76e4e33ab8f3c050bf6f9b9b --- /dev/null +++ b/3b_layer11_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea7d23526bb8d5f0b02e1880eef77dd4d00c4f40bc5ae89883839d49bf313fc +size 92585563 diff --git a/3b_layer11_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer11_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..85f1c11491ec65d530741aaafaf978d773c1317e --- /dev/null +++ b/3b_layer11_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43cb1294fa1a2a182d7b712f2383b4e08b7c828852d3da8a2dee12e039db06d3 +size 92585568 diff --git a/3b_layer11_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer11_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..00d523ef2e36a416b9a2cfe0280a90f882a80194 --- /dev/null +++ b/3b_layer11_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:956cc0eea2ee9be976380e595e1e11880319fd81d8ae39ca7aad7cdbb168d6f2 +size 92585563 diff --git a/3b_layer12_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer12_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..545075e539ec874832324ec922b5b6a168bc98d2 --- /dev/null +++ b/3b_layer12_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78476e420e4865b9014eae7dc1daad3d305b82252b116c6b36f61c6d68e97617 +size 92585548 diff --git a/3b_layer12_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer12_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2e054946145e61cc0a2949a24e4cc7dc151b0e6 --- /dev/null +++ b/3b_layer12_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc3d58b07df379be01588adfa2704b633b953f8edfd8b0db38f3219446ca433c +size 246892113 diff --git a/3b_layer12_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer12_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..496484dc631e62d7a30d04c2b7d9d27c906aaa96 --- /dev/null +++ b/3b_layer12_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b01fd72138e738b24e73c402a9b000d783b1a9476e69aebc8bf948f8e9ed5f7a +size 92585563 diff --git a/3b_layer12_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer12_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..79dd11fd9b6b208381b5a9bf4d077a46168ea076 --- /dev/null +++ b/3b_layer12_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4955b336fc5b4888760eb1db65df2038f84125c078e38b7a6ae6fea49e9a3b7 +size 30862944 diff --git a/3b_layer12_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer12_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1d6e2e846d8a2e8f4d53f738d5484ed5c22fe2c1 --- /dev/null +++ b/3b_layer12_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6135e2ee040bf8aa82abd223dc7114b9b5c33b88679507a42fce8bfc4c66e08 +size 92585563 diff --git a/3b_layer12_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer12_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a68ed156726e546a592491730fa826caefce693c --- /dev/null +++ b/3b_layer12_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a7f8a80ecef30b618cb0dfcb931d7e1024154b334d8bd6bfc97f4f79ceee7fa +size 92585563 diff --git a/3b_layer13_mlp.down_proj_input_reasoning_representation.pth b/3b_layer13_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad5d1dfecbb680e41cfd48bebbb254ffa948aa53 --- /dev/null +++ b/3b_layer13_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:542efdb87938991c95da06c76cdd3cb977df68aa10607979bf3f5d145332a251 +size 246892108 diff --git a/3b_layer13_mlp.up_proj_input_reasoning_representation.pth b/3b_layer13_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d0a746967a341e4a38214bfc1737f77f8a1369b --- /dev/null +++ b/3b_layer13_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:779f8974ea94c355a2bdaeed286a33c0ff32584a848d3c586f3002ceaeff2081 +size 92585474 diff --git a/3b_layer13_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer13_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c609f45b9aa7b5233e0e42d305789b7c7038d42c --- /dev/null +++ b/3b_layer13_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c6dc3ed095404375f32a3d30b51a8fa12613b00322ce8365f90c61a2022713 +size 92585568 diff --git a/3b_layer13_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer13_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..781b00292c47c85ebe7a6f8972189ad22b31472c --- /dev/null +++ b/3b_layer13_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afffd9cc4c2dcf82321a71a6aaa22dca7e38216cde45ffcb15c1413c960c8bce +size 92585568 diff --git a/3b_layer14_mlp.down_proj_input_reasoning_representation.pth b/3b_layer14_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d8e51be88144b2df17317a03059723f3ccc6d505 --- /dev/null +++ b/3b_layer14_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e829fcf93b93715d58f2d540288eedf30a984f3c740f3001ce576abcaa77779f +size 246892108 diff --git a/3b_layer14_mlp.up_proj_output_reasoning_representation.pth b/3b_layer14_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4027af5bb71aa80eb0963e73b7aab052c9f9fab --- /dev/null +++ b/3b_layer14_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:006e341d3845a58bb4b2a7804a5b2a5f37c10f1e6f9b2613d97c6f971e897ecd +size 246892103 diff --git a/3b_layer14_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer14_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c507fd9e10ca094efe35c3dfb06099febd10d0b3 --- /dev/null +++ b/3b_layer14_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49dd3649ebe2f922a3f0ee3a17d3919eab6d1855affcf1ef3e4c7d539160ff6b +size 92585563 diff --git a/3b_layer14_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer14_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce2694a1037a553ba5e610dac370ff2f5cc2df9d --- /dev/null +++ b/3b_layer14_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c55f7cae047e9865895a3044f170a4db8ab863c5e24244a6ed7201c9a507ddb +size 30862944 diff --git a/3b_layer14_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer14_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..203a71021e595f1d9ec162aaf1798e16e89b675f --- /dev/null +++ b/3b_layer14_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4616711f27ef89f86b8c32f019c7301af8a9279901cf3970a925f934eb2fa653 +size 92585568 diff --git a/3b_layer14_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer14_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..866b8bf0ffdfcf26945eaa72ad38e2108f5bc37b --- /dev/null +++ b/3b_layer14_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b8f60cff06bc947959e8ff696f3340093b18b6e0787f7a1fde4894d0d2c26c +size 92585563 diff --git a/3b_layer15_mlp.down_proj_input_reasoning_representation.pth b/3b_layer15_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bfa91130ff280825ebcba73dcbf9537d59046cf9 --- /dev/null +++ b/3b_layer15_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021f37affc7ae45f85a3dd53cfece443b7c1c62409275240554c58d14696c2d4 +size 246892108 diff --git a/3b_layer15_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer15_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8e98a9a50d20d704c50efc1d64b35345fcb5352f --- /dev/null +++ b/3b_layer15_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e9519266119a2a1c44394bf2c4c0313e47c578c222816bd7f47508d03b786d +size 92585548 diff --git a/3b_layer15_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer15_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5ef404dc45e10b81ababde2fe35bc5684d740fbf --- /dev/null +++ b/3b_layer15_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e2248d63885f0340310f64979313fbbe5fbf69cb26ed2d035191e252d6c0f3 +size 246892113 diff --git a/3b_layer15_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer15_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d674e3f15fa8f1d5da6157613b43f86a649b2821 --- /dev/null +++ b/3b_layer15_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73fd7fa157787a64e533b1df356ce26f0d6e08aeeb7d0cab3dff14450b6f07d9 +size 92585563 diff --git a/3b_layer15_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer15_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4232bf92d0ed9d8a67134042d899789a2faf62ce --- /dev/null +++ b/3b_layer15_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ddd5f5e8ae9a690eca0ee2e8cbcabbac21d586a7a502e6f8a6df2a8fbe1578 +size 92585563 diff --git a/3b_layer15_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer15_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e3034e2fd66dfcd8905d138ae9a72f0a026d259f --- /dev/null +++ b/3b_layer15_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ffdc75430676d23ff0d1864459e758725f354c939f66ebe29bb64c088f5a59 +size 30862944 diff --git a/3b_layer16_mlp.down_proj_input_reasoning_representation.pth b/3b_layer16_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2e5eef1eeeabe0f6231bfa8ac2512bd8262e8687 --- /dev/null +++ b/3b_layer16_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd250f7738c7013062b969080c9bd44e3132c13b45ae22046f755675828437f +size 246892108 diff --git a/3b_layer16_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer16_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad13095b320f7ba64b7d67689e63909b7b2ec05a --- /dev/null +++ b/3b_layer16_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0801768222f56c59de43bace11912e82014ee9aed33141391135813273725b1d +size 92585548 diff --git a/3b_layer16_mlp.up_proj_input_reasoning_representation.pth b/3b_layer16_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ba75c2f458ca51a2bc463579990705d7be39ff48 --- /dev/null +++ b/3b_layer16_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f8e57c705586492b165d3beba17f976094cd0e4f57716279c83bd2a22300c22 +size 92585474 diff --git a/3b_layer16_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer16_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e4efa84586b728199e2c1dffba4bc0e916ce895f --- /dev/null +++ b/3b_layer16_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbab3018868776356fb8c57c9dac10913bb97708bf35ffded264e2d4bc9773cd +size 30862944 diff --git a/3b_layer16_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer16_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d197b77ebc6c396846f538702f6937b435a4a879 --- /dev/null +++ b/3b_layer16_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d95a04623889360f95755839c06517d981cea16ad3ed46b345caee1289b1de58 +size 92585563 diff --git a/3b_layer16_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer16_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6b35cda2d5a32801fb58e7806ad07e1b211170fc --- /dev/null +++ b/3b_layer16_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd603335fec5c7fb1aedb3f972c2689fbd2571edd9bf7ea3d7755369881193a +size 92585563 diff --git a/3b_layer17_mlp.down_proj_input_reasoning_representation.pth b/3b_layer17_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8792d35718d25ccd4fdb357399cbc658d71740c3 --- /dev/null +++ b/3b_layer17_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d5ed0d1360aa0a5c356b714bba09d74bdfce753e877a560730b21d6db18b1c0 +size 246892108 diff --git a/3b_layer17_mlp.down_proj_output_reasoning_representation.pth b/3b_layer17_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8d14ed1aed817a763847aa72b9907e6269845989 --- /dev/null +++ b/3b_layer17_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9aa8b2d2d4fb074086eece09051549778d88b322cabbf193f400f23e610f1aa +size 92585553 diff --git a/3b_layer17_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer17_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..09cc66894bdd69e088fedacfabda657512610de2 --- /dev/null +++ b/3b_layer17_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2983219d1869f121149db4c8dfcfde6da36cce69de9be0d7df71a07401b73434 +size 92585548 diff --git a/3b_layer17_mlp.up_proj_input_reasoning_representation.pth b/3b_layer17_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..39ea6caa8a2c954bf04e05cbc8d818b765f29df4 --- /dev/null +++ b/3b_layer17_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fc4ceb6ee214182632874724816f860a7d3dd1b13898e2c0213fd09b209dacd +size 92585474 diff --git a/3b_layer17_mlp.up_proj_output_reasoning_representation.pth b/3b_layer17_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..32354aaa1675c67920393f48671617652696ab39 --- /dev/null +++ b/3b_layer17_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2423e8a6dec6205d15c3646136d4bd943c919a61ef71e40872cfeea15c300dc +size 246892103 diff --git a/3b_layer17_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer17_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..78ed16cedeb13df8729692b066e369bc2b092f60 --- /dev/null +++ b/3b_layer17_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aac62abd5af0fb34335c31001bc17a3258befa432b0c118c762e840405dd508c +size 30862944 diff --git a/3b_layer18_mlp.down_proj_output_reasoning_representation.pth b/3b_layer18_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f73ef80baed0feedfbe9e2a0a08f5039551e240 --- /dev/null +++ b/3b_layer18_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a48990044ce78dce740f4c3169345668294030c6c8e255a71784226789f3c58a +size 92585553 diff --git a/3b_layer18_mlp.up_proj_output_reasoning_representation.pth b/3b_layer18_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fc4ff633e7f4005a9ffc2115d49c34e2b42b0095 --- /dev/null +++ b/3b_layer18_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9727da571130a4ae3ca8949d8aa2e5c9cb6c88af4f78a930b0a667dbbe080863 +size 246892103 diff --git a/3b_layer18_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer18_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..27383b0639fcb1a4dcf369dcd76c82996f19d6c1 --- /dev/null +++ b/3b_layer18_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1f21135eb9edb6f689e1559abd621f8960256b4325062ad0240a05a3a4b5d83 +size 92585563 diff --git a/3b_layer18_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer18_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdbbf2d73c988b3bf35f150e82449600410157c5 --- /dev/null +++ b/3b_layer18_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8990df073fb76ef26747114b7fb96719668d1b454e6959a7e5bea07aa0bf6f +size 92585563 diff --git a/3b_layer18_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer18_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0cae97ccd454b154436c32d2b737f23a9328083 --- /dev/null +++ b/3b_layer18_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a6e454d41130e6b196f76c5150d6f94d9f8664a78a725465765aea7a9164571 +size 92585568 diff --git a/3b_layer18_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer18_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3111ae6156418a72223db92e2ee6cf254e700840 --- /dev/null +++ b/3b_layer18_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa210e8d9725df8630cc47a1007eca5f088b44ceb7cf8c7331bf36d8a702202 +size 30862944 diff --git a/3b_layer19_mlp.down_proj_input_reasoning_representation.pth b/3b_layer19_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..98a84c98c15c2fca5930240660742251203e2e07 --- /dev/null +++ b/3b_layer19_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:684d352bc0716498f16a6de65499306e05b4d72c3223b2b1dd537cd1055ad084 +size 246892108 diff --git a/3b_layer19_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer19_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5ed9bbabba4ae9e76a4fb2942dacb69b9ad4a13d --- /dev/null +++ b/3b_layer19_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e58967f14471caa3078d87428ebe28ab18e1a20c4e88bbbed5aa5532a21bfe5 +size 246892113 diff --git a/3b_layer1_mlp.down_proj_input_reasoning_representation.pth b/3b_layer1_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d546aea2b323ae7fbf4b7114502442896fafb4ec --- /dev/null +++ b/3b_layer1_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c4bb984b8b0b9e97dfeee0eaeba5b5ee0942281de6b540616fa5c9c36dc992 +size 246892103 diff --git a/3b_layer1_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer1_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1beb1cd9d6717434363f53fc193b11f77d06c11a --- /dev/null +++ b/3b_layer1_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab1ceb0b3c8efa82374a8fd241952adb27e07a29dc193f6c763979603208dfca +size 246892108 diff --git a/3b_layer1_mlp.up_proj_output_reasoning_representation.pth b/3b_layer1_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb8a473bf57834f4c8bd9ed1802f574be9b97ebe --- /dev/null +++ b/3b_layer1_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af872797ee96b3a7f680270773b60d66f7c70379ab97d87f63cb46ab92304628 +size 246892034 diff --git a/3b_layer1_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer1_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6ae1bf3943635585653d60ded954c96c100998d1 --- /dev/null +++ b/3b_layer1_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e7ae72f5aaa6bdf96d4cde89c4968574fea628eebd8dc4d1298df5a562b88d4 +size 92585558 diff --git a/3b_layer1_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer1_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..08e36cfbb91f7b7c9e2d4fbf47d32aab26222105 --- /dev/null +++ b/3b_layer1_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24a390823c5505cc1f224913ce11eaa1aca26227301588c921a9698294d87c7f +size 92585558 diff --git a/3b_layer1_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer1_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..014e7ca27162d711df02613cc9fe95d248651d04 --- /dev/null +++ b/3b_layer1_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97727828892d8395c8b7470c0370d661c48b0a05cc39a06bad4bb5f8ad07bd57 +size 92585558 diff --git a/3b_layer20_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer20_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7a65f7c812659b92ae00891daa37103d7e8e5ead --- /dev/null +++ b/3b_layer20_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae8b5dc9b1f88e90d2cb90650060c0e15c470587baa68cfb637292509e50545 +size 246892113 diff --git a/3b_layer20_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer20_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..70710eb7aa931d2610a0bcc2dc8555046547f1bd --- /dev/null +++ b/3b_layer20_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47197eb10a2847baba9379d35b99f5cf24b6378c35520b6eabbb1e06cb179029 +size 92585563 diff --git a/3b_layer21_mlp.down_proj_output_reasoning_representation.pth b/3b_layer21_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f80223160ab8c67f139e6d08ac1df6af2b0d930b --- /dev/null +++ b/3b_layer21_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74318c1fc28e8593f1646893cef08cd79e676b0d43b0d5e07bc71969f6ca269c +size 92585553 diff --git a/3b_layer21_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer21_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a90d5b2ad096ff18d588f87e05f5d06ba9b81d3e --- /dev/null +++ b/3b_layer21_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6ba3acc65fc0155133968082299d7616d879d7a8927cf8ce56ebf82447bb3b5 +size 92585548 diff --git a/3b_layer21_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer21_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fbb6b3c6b921e41d2ec081b90a2b005138ba9938 --- /dev/null +++ b/3b_layer21_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d7a1056695fb46042f2577e581a72b755f3296a4baa1cc8cc8392f89453331b +size 246892113 diff --git a/3b_layer21_mlp.up_proj_input_reasoning_representation.pth b/3b_layer21_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..aef924dcc1adce549909f9620d9a424febf7a1be --- /dev/null +++ b/3b_layer21_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ada322622b9c19d8888a0f071052b50783c2b1f26d3d7ee0b3a19a7d09d83db +size 92585474 diff --git a/3b_layer21_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer21_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a11f0f2369979255b8bd01f8dfed1667b09dd80e --- /dev/null +++ b/3b_layer21_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce8eb3ba225379bd016f3520d7006eb503416d9beaa412a3a10773e98b49040 +size 92585568 diff --git a/3b_layer21_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer21_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7b7bc7a4893b54a4c5c588c0c28bacf88902210 --- /dev/null +++ b/3b_layer21_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ad204cd8650d519374722e338d44a50fd2c349cb8d35656ca8092fb6f8ffbe +size 30862944 diff --git a/3b_layer22_mlp.down_proj_input_reasoning_representation.pth b/3b_layer22_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5b9ff2c9a261643bb9492540f820ee0e704a3ee --- /dev/null +++ b/3b_layer22_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b3d73297d2e4ef0081da0b5a99fff5e46f6a980698a8fc6025e2820c28f3dc +size 246892108 diff --git a/3b_layer22_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer22_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..39ab3399dd4f8319911829519aa5516a378268f9 --- /dev/null +++ b/3b_layer22_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0491c177d7fef34007213973fc9c204c1b3409ed2f2ba1fb93b76b9995b624ba +size 92585548 diff --git a/3b_layer22_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer22_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a600cd31f53f6589f9314b3b07d3b81a4d1307a2 --- /dev/null +++ b/3b_layer22_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6070b9299f64902bbc7364190e63276a542b93c02fa913bdef752dd9edc1bacc +size 92585568 diff --git a/3b_layer23_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer23_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a5f5e4cef730487a91c088f2170452d44b93f746 --- /dev/null +++ b/3b_layer23_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4670142e4ad34adeac0a11d1db75239ac889395fd7f46bb92625395d9122ff92 +size 246892113 diff --git a/3b_layer23_mlp.up_proj_input_reasoning_representation.pth b/3b_layer23_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f2a9135c49fe47883c75cfdd231afe68eb4590f9 --- /dev/null +++ b/3b_layer23_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e6bf4f0a5e35b6634aeda06ffb3d617c98da1917358c353254728b68798d50 +size 92585474 diff --git a/3b_layer23_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer23_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ba5400b3f1fe1550cbd33957853a1f523381e30c --- /dev/null +++ b/3b_layer23_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8376e49adfe2c77d846ac50204d9a4b3df65675abdee4dba39621b234eaa99a8 +size 92585563 diff --git a/3b_layer23_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer23_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca09dddf5d5fb9da03a2cd2853a8c4005ad3ad94 --- /dev/null +++ b/3b_layer23_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:463b13aca5be21f8cb5373dce843f498d963f11526f57e257c18f8cfd1ac7557 +size 92585563 diff --git a/3b_layer24_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer24_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d67849c4987d17f60dfbc99bbefddcc2a9a3ba7 --- /dev/null +++ b/3b_layer24_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8987f7ac8145c8becf8b191fcc125b13c9a0dec7acd910402ff33c8700527aa0 +size 92585548 diff --git a/3b_layer24_mlp.up_proj_output_reasoning_representation.pth b/3b_layer24_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8d7b214653e8921b782762c32cbbd109ab8c4809 --- /dev/null +++ b/3b_layer24_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b8c384cae65d74db28952d0c487e116fc3568049df27289da51e36593985c11 +size 246892103 diff --git a/3b_layer24_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer24_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab65a2ff64022d2ae578511df35d08b54038dac6 --- /dev/null +++ b/3b_layer24_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a7f8c534c0f4616af55479c356c82ff0409f386d534e3a444acf66eff92cf27 +size 92585563 diff --git a/3b_layer24_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer24_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..41e3ac609a181eaaabcb3f285a7e80c83f674f56 --- /dev/null +++ b/3b_layer24_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1088c7d5d2f2682eca0a0f84e761631abcd488e3cae5a4d3223a718c5704119b +size 30862944 diff --git a/3b_layer25_mlp.down_proj_input_reasoning_representation.pth b/3b_layer25_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bd7560e22b3186453d08cbb28a73cb7bacd32dd1 --- /dev/null +++ b/3b_layer25_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:940578f98db2e9efacb3f1dad19777bd8f1a44fa68290a340ebedd4897378afb +size 246892108 diff --git a/3b_layer25_mlp.down_proj_output_reasoning_representation.pth b/3b_layer25_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..97597d481a584d3762cf37ef74811a9eb82f0753 --- /dev/null +++ b/3b_layer25_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b49cf26ec78739ab0ba3072a1bce02165d3cd93d2f7b5aa65ebde94135b2ce04 +size 92585553 diff --git a/3b_layer25_mlp.up_proj_input_reasoning_representation.pth b/3b_layer25_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..20415e0ea9070ee54d086f7ba182d8931db98c1f --- /dev/null +++ b/3b_layer25_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f91b0c4a413df60d32a6da090ebe2e3c3b69cd7166e378dc0122224cf9ef30b +size 92585474 diff --git a/3b_layer25_mlp.up_proj_output_reasoning_representation.pth b/3b_layer25_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..129f81630fdce0ca8d4d1b2dfe9a9b68208ed5c8 --- /dev/null +++ b/3b_layer25_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cafa0778167525b0e1c2494d0d521f93c0c05fc675ce9c4b4dc42d09d2dee26 +size 246892103 diff --git a/3b_layer25_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer25_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..481ac98f5f61785443b3e27469b92447d2f2e414 --- /dev/null +++ b/3b_layer25_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbea8651930c88b52278bce0511100cd0e1fe3c3d2cca879bc032b39ddf031fe +size 92585568 diff --git a/3b_layer26_mlp.down_proj_input_reasoning_representation.pth b/3b_layer26_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..25fa910b8b24b5bee3b76b73dc5bd765d8e5647b --- /dev/null +++ b/3b_layer26_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4dba3067d80668594ddaadf556feef0dcc824a89ae4d1b22b4f76a4cbb56b70 +size 246892108 diff --git a/3b_layer26_mlp.down_proj_output_reasoning_representation.pth b/3b_layer26_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..02076960a17f242e14837f389f13cbe754fa5372 --- /dev/null +++ b/3b_layer26_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939cf914bd45505160c35a5338b28fbe9e3cafdf87bab87a0c90af6ea80e30ad +size 92585553 diff --git a/3b_layer26_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer26_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..156d6226c97615772221505aab952ce8256341f3 --- /dev/null +++ b/3b_layer26_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8551131debfd049b16ec0eafe85a6395f1649ea7d8e17383ecea2f5de2de1c +size 92585548 diff --git a/3b_layer26_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer26_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..590b5a15d22982e58ee3f6d5da316fe7304cfbe5 --- /dev/null +++ b/3b_layer26_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91e74cecac8512d16621710266978aa3c8a2f7a02bdbae73de2e2d5e8f344ba +size 246892113 diff --git a/3b_layer26_mlp.up_proj_output_reasoning_representation.pth b/3b_layer26_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..48f05594c40c66899739f231e84a0b7f27bf691b --- /dev/null +++ b/3b_layer26_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc53373406e074a9f20941c67424670b79219375296d46d00e9cc5075df61668 +size 246892103 diff --git a/3b_layer26_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer26_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a2d0a8a11c026616ec6ccdf272a41e9dc64cc373 --- /dev/null +++ b/3b_layer26_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fb953db4bbc5c5f51947464ea9fc282cb31033a3b1fee02eb37c641a056ec07 +size 92585563 diff --git a/3b_layer26_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer26_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..08384314d969edd02acc8708537396d99c74b6fe --- /dev/null +++ b/3b_layer26_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fd396ed237a72a07a63f9730e866e912b8355dc71533a0428b2c60b9700455c +size 92585568 diff --git a/3b_layer26_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer26_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f11e02b987c36ed7e5d56849b32d693546c39968 --- /dev/null +++ b/3b_layer26_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19b0655366b6574164eeb9231ed6cbad1505ea61241dd62ce02b756a50909ea5 +size 92585568 diff --git a/3b_layer26_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer26_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2414f75c2390b7dde7c7131e7c40a68281dacffe --- /dev/null +++ b/3b_layer26_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a08fd3c1b151f2b1714b908e4e198f8ed28f77d594c405566a368a0705295a30 +size 92585563 diff --git a/3b_layer26_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer26_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d9d32031a8018ce3fd4c59d9a8f3089b1bda141 --- /dev/null +++ b/3b_layer26_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc510884b3ac8a8e0381dfd5bb7128993dbb1dd503e6cc48f3c9afa15e20425e +size 30862944 diff --git a/3b_layer27_mlp.down_proj_input_reasoning_representation.pth b/3b_layer27_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5c99d8f3f728acc7c339473cb2bed4b12205028f --- /dev/null +++ b/3b_layer27_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b898f1b9b2bd17ce305319ed8ff39daf8ff5fed56628796b16a327806a3451d +size 246892108 diff --git a/3b_layer27_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer27_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0a7feb4432789e309cf57b042a39b856eb1d1880 --- /dev/null +++ b/3b_layer27_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:160074afad5eee78e64353aedf9907f6675313e1f1df3942557f1e2ba962a3b8 +size 246892113 diff --git a/3b_layer27_mlp.up_proj_output_reasoning_representation.pth b/3b_layer27_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7bd7cd73ecc0ea91d32e619ad2f7d360b41a67c9 --- /dev/null +++ b/3b_layer27_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a0bfaface95acee366ebe4eaf6cb5f0bc0a8a6344e4dcfd0a3be89b61d9a67 +size 246892103 diff --git a/3b_layer27_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer27_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6bf9b01ebd3b6fb8b42b640532fedfee013b560 --- /dev/null +++ b/3b_layer27_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66bd44e3cea1b3fd537f0dc6ddb843a6634ed9f8c32d77413b3637c7ad62fd3d +size 30862944 diff --git a/3b_layer27_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer27_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b009bbea524e47d06063de85486bd7bdae6018de --- /dev/null +++ b/3b_layer27_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3686d94f1bdcc22cb2765885af8b7b9225db21d5df06c149d6467f5a463c0b5c +size 92585568 diff --git a/3b_layer27_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer27_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3597befb7eae01ffebf667a0047739a3d60918d4 --- /dev/null +++ b/3b_layer27_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fbdc52811ef6d8664bda49634cfcf7973ef047623444558c0fd364a31ff0f05 +size 92585563 diff --git a/3b_layer27_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer27_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..27e2730e6faf84b5bbbf5ddb002d6b6a4f8638b9 --- /dev/null +++ b/3b_layer27_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d73b02ef876d2addcbcd58d0a9a20e80a9371f04d1c21f6e7b6d0f7943f04c +size 92585563 diff --git a/3b_layer27_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer27_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fbfc983a9cdea7f85c752749e0fa5098e79a7a90 --- /dev/null +++ b/3b_layer27_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd50b4fba54e05f1731624afe41493bb80804b90d003305a8d5e70e7b75f59de +size 30862944 diff --git a/3b_layer2_mlp.down_proj_output_reasoning_representation.pth b/3b_layer2_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac5d137d9238003e464ff1ed8af51f271401a49e --- /dev/null +++ b/3b_layer2_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f94c6b5df47297bd6dcca1f23bf2218e1d38b5e605875c7d5561f2037b5d46 +size 92585548 diff --git a/3b_layer2_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer2_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1b483ece1403a17b131e8041a37e40eedda8e723 --- /dev/null +++ b/3b_layer2_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd4343d70ef75dfed81001f5dc83d4f46908742d0c6ba076f2420f42de1eb488 +size 92585558 diff --git a/3b_layer2_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer2_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad413d1f9cf6391bbe8cafa973fee28abeffe57c --- /dev/null +++ b/3b_layer2_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37cd4f89ef8483003b9df47920ce95c0f96997d56742bd8f2708a3eb84f5112 +size 30862939 diff --git a/3b_layer2_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer2_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2bde62005a0d0275a6bb88fddd243037207da7ca --- /dev/null +++ b/3b_layer2_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ba3555dfbb984e1b7b296007753b80db5cf5ce32219331f88c199ee0dd328ad +size 92585558 diff --git a/3b_layer2_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer2_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b93914366bc454bb55a028c06899e4d4131ef9a6 --- /dev/null +++ b/3b_layer2_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:538bdb851deaaab5e435c6c4650cde44d97c90da2a64ea8fd0718eecb9e9bb25 +size 30862939 diff --git a/3b_layer3_mlp.down_proj_output_reasoning_representation.pth b/3b_layer3_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f3373f49684a9e83fa0025749a4dc6aa7acd1390 --- /dev/null +++ b/3b_layer3_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:993212cc8aa80f93d68b0a84874ce3c3b171bf5ed08aa9c789b94a80e6281af0 +size 92585548 diff --git a/3b_layer3_mlp.up_proj_output_reasoning_representation.pth b/3b_layer3_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..072405b6832125633f9ba356c654e3fe368394c2 --- /dev/null +++ b/3b_layer3_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85fedd78e3cba0a6ef3d74d56da95046853d920cdce1704b793008ffc2bb42e5 +size 246892034 diff --git a/3b_layer3_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer3_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c73185b5f6422cca8b9528defa225cd6f58de24d --- /dev/null +++ b/3b_layer3_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9af45d7d24623569d184530d7a6ec08414a4549bedeef33b660d990ab93bfc4 +size 30862939 diff --git a/3b_layer3_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer3_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6dc04315586b2a5b5e7921d414a69a53f9bf8b00 --- /dev/null +++ b/3b_layer3_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b65c2af6e93d5267fe14e82a3eea77b56af472e74c99496d9d39f2513c4f7dc +size 92585558 diff --git a/3b_layer3_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer3_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..940257e6bded9dabcfe5daf84fcc9ed28d92cd0b --- /dev/null +++ b/3b_layer3_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22faee9b9390fad2ab4809afa53c140abf32329ba726c11a291c3953de13f86b +size 92585563 diff --git a/3b_layer3_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer3_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0ca1586b9d436c49de0f3c1b7924f098007d5f07 --- /dev/null +++ b/3b_layer3_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f1d15e669d4dc4611ee52b6806ceb263ae6d3711ee3a2a88bfdba16561c95f +size 92585558 diff --git a/3b_layer4_mlp.down_proj_input_reasoning_representation.pth b/3b_layer4_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c79a50d3a41594d908607520a84d7311a3ab874 --- /dev/null +++ b/3b_layer4_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b335d038fc55592fb918dbc41677434cb583f76ad049d2c12426eeb5294623 +size 246892103 diff --git a/3b_layer4_mlp.down_proj_output_reasoning_representation.pth b/3b_layer4_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7e879a694c0070e7771badcb273b992738091f97 --- /dev/null +++ b/3b_layer4_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94f4239eafe9cca3c6428ab5c46edc2dc464d30275101e9bb0511369b56cee8 +size 92585548 diff --git a/3b_layer4_mlp.up_proj_output_reasoning_representation.pth b/3b_layer4_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee22199423e67cd05e99cc29fd418db8c5d50300 --- /dev/null +++ b/3b_layer4_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5161e46dbbe6fd431672db0a0bcb15ee802caa0566044aba14eadf44751868d +size 246892034 diff --git a/3b_layer4_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer4_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..53519b32f776e0edca992cade295c5175340aa2e --- /dev/null +++ b/3b_layer4_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3174c1f62fb92350618d02aed05d92412f44c37a4bd61484a2faf5a7f8bda1 +size 92585558 diff --git a/3b_layer4_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer4_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1000e499e27933bab631a8af017c48db38feba98 --- /dev/null +++ b/3b_layer4_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8085544a4b35d544479cb4f64a6e7ab0054c860421f684b2d1989e499fc0346b +size 92585558 diff --git a/3b_layer4_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer4_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5b8d03ec7b6dacd617eda731b79a7e6883715d47 --- /dev/null +++ b/3b_layer4_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f298b96e36db8d3c0c0c367ac1c4957d2a99daa57b0dcb9ddd269136cb9e089b +size 92585558 diff --git a/3b_layer5_mlp.down_proj_input_reasoning_representation.pth b/3b_layer5_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..89a998bbcda08b0a08e8eaa458c321dfdafb95e4 --- /dev/null +++ b/3b_layer5_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8486176b1339e16604c3a8a530f6793ff8762da19958c394dbb842adca2398c1 +size 246892103 diff --git a/3b_layer5_mlp.down_proj_output_reasoning_representation.pth b/3b_layer5_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..26be4de2ba48775cc749f0fa129c5a563f4f251c --- /dev/null +++ b/3b_layer5_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5995c23b73f31c9c184a7da22029411f5a1b2094c1adba0437d76e7784d465ff +size 92585548 diff --git a/3b_layer5_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer5_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..443d031408833c7ad8a7b1cbed98262fb9ed4b87 --- /dev/null +++ b/3b_layer5_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d302a39010a5774f521593dd7af1caadc0afedc1d7b0053016217182fe27cce8 +size 92585543 diff --git a/3b_layer5_mlp.up_proj_output_reasoning_representation.pth b/3b_layer5_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce95db002df8c3986d314fd6bb22c52ba3ba277b --- /dev/null +++ b/3b_layer5_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31587a321faa54358e547bf2f4087da457c019cc1833d3549496a8eb20fa2f22 +size 246892034 diff --git a/3b_layer5_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer5_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f249fab1baead534dac9fff2dafee33bc82a27d9 --- /dev/null +++ b/3b_layer5_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7fe2c9880313562b6afe1e497fb8f889261e09d64b8822cf2913a739e678df +size 92585558 diff --git a/3b_layer5_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer5_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cefd47a714f5851eb939725313f41ea52e07230a --- /dev/null +++ b/3b_layer5_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b30396ccb48e3d6a8081e6ab55258b2ead3eb115daa1eef2626606b9eba233f +size 92585558 diff --git a/3b_layer6_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer6_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d1bfd7efc6f891279178d55cc146720b79bc9f7e --- /dev/null +++ b/3b_layer6_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd79323478f013ca83a4ff3112a085d23ed0acf5e061141ea5e756db06fa7e3 +size 92585543 diff --git a/3b_layer6_mlp.up_proj_output_reasoning_representation.pth b/3b_layer6_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f5c4830ecfcd1a79f71670a28b6f499b4824436 --- /dev/null +++ b/3b_layer6_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc0ccc819bae2d41a3d45f46d5d0eec9b2082dbf41248e7692e58ef281671f0 +size 246892034 diff --git a/3b_layer6_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer6_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d1d15aca8447c01564390b153b18bbb81d48a1b --- /dev/null +++ b/3b_layer6_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb3b79376d7099a18dfbe9e89ad1de21f5210bbf02d224f3a9e024e5c1d346fd +size 92585558 diff --git a/3b_layer6_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer6_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5c7e4ba79cdbcf46b99bc20845d58a83d8443266 --- /dev/null +++ b/3b_layer6_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa3232f126e4f772841e47a8f5fd50bb095f8a0757929cff1f30c01b2e3d801a +size 30862939 diff --git a/3b_layer6_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer6_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fb673cf4d673e68658e036ebbfb90750574307e --- /dev/null +++ b/3b_layer6_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49f903235facb83151bbc3cc6e6a8b1ccf2e321286d1fa381bf4cb41e0330d4 +size 30862939 diff --git a/3b_layer7_mlp.up_proj_input_reasoning_representation.pth b/3b_layer7_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..612850c32fed9a20e33ddfe15306e1ba0ef5a24b --- /dev/null +++ b/3b_layer7_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c39ddb8a75d1b22c931031a383c67264dccc5e958a1fa162cd5f2a6f2c84cc42 +size 92585469 diff --git a/3b_layer7_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer7_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8eac08b4b4c06e6e0f2f4864641ac147ccc176b1 --- /dev/null +++ b/3b_layer7_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65ef798b4791c14ca904d7d2625172f75c1260dcbbca768a06c31fb023db45cc +size 92585558 diff --git a/3b_layer7_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer7_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9e57ae9be92d9191784b1126dde85e75027bbbaf --- /dev/null +++ b/3b_layer7_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1eb335ad447d0bb88a3803bae834a9714a9aabefb66db66e99592676d1288de +size 30862939 diff --git a/3b_layer7_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer7_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..729e18affa2d0dd1679fede5530fe3883e1eeb28 --- /dev/null +++ b/3b_layer7_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f1aa5707acdce5451e94316a37f577000895adf4d2a42dfd5e816bed6b46a4a +size 92585558 diff --git a/3b_layer7_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer7_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4df06906a9216413bc074b6392cfea10401c9f9f --- /dev/null +++ b/3b_layer7_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2265b552d8cbd31c5856d157e6261f92abdfe66c0509cf0f31c1bf6d7bd894 +size 92585563 diff --git a/3b_layer8_mlp.down_proj_input_reasoning_representation.pth b/3b_layer8_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..28adf5d8693e90d69de5c59bdacf2651ed565987 --- /dev/null +++ b/3b_layer8_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af2562c70989c3ed575b2992574c2aeffcfb47af9e0422e155594e1a2f8c92a9 +size 246892103 diff --git a/3b_layer8_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer8_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c64f1b1c0b46dae8c273c782664b68637972a109 --- /dev/null +++ b/3b_layer8_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52ef883587ec389eb2aacf0a11593fc5b1db8ace5f26a69118ec2b306408c6e2 +size 246892108 diff --git a/3b_layer8_mlp.up_proj_output_reasoning_representation.pth b/3b_layer8_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3843dcf7704ae8421d85f305e180d7a3ffba66de --- /dev/null +++ b/3b_layer8_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c795e4c123d24affe1703ec87b1df5196c2d0c2206f75fbb4d75ab6e0b8c18 +size 246892034 diff --git a/3b_layer8_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer8_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..baad324c866e5950fc29f52dbc1a36d668f8a81c --- /dev/null +++ b/3b_layer8_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a409eda94293d1ab9f06648304188795d20af6c63bdd56199c594461c007878 +size 92585558 diff --git a/3b_layer8_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer8_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e33db3058a385918bd82701669de9f62dcd6829 --- /dev/null +++ b/3b_layer8_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0391a5ada8ffa2692f704fcae4bfc2fb55a2f38228a89be774bba09226d5e9fe +size 30862939 diff --git a/3b_layer9_mlp.down_proj_input_reasoning_representation.pth b/3b_layer9_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0be48f16dd88fd6614b24d76c0f5b7fc394abcd8 --- /dev/null +++ b/3b_layer9_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8a0f012bc34931c41f6e61af1d62ce29eed18fef5bda60b1c1f9cfd9e5bb21 +size 246892103 diff --git a/3b_layer9_mlp.down_proj_output_reasoning_representation.pth b/3b_layer9_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d5b5abdcb46805d4b1cd2f210a44186ebe3032a3 --- /dev/null +++ b/3b_layer9_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd204580fe0d00c91e585b5ecfdf061f4dbcd607e1dcb6bc80696fff8ba07a8d +size 92585548 diff --git a/3b_layer9_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer9_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..27d31ecccf1d9a88476ee3bd7999d575531b5c1a --- /dev/null +++ b/3b_layer9_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:334bea76b91eef769a2fedadb105de2e70104a0fe60eda44cb63e530efa4b65a +size 246892108 diff --git a/3b_layer9_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer9_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5550ed8a217f3e421f9431b7bdeb451a64a2b558 --- /dev/null +++ b/3b_layer9_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa9b790098b197fada52615ed675cd06a3aad18025019604668ddd18d86ebb5a +size 92585558