diff --git a/3b_layer0_mlp.down_proj_output_reasoning_representation.pth b/3b_layer0_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5321cbe4f5f21c8cff4bc492dff8d4b0544756fa --- /dev/null +++ b/3b_layer0_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf80fcbcfff5165d31b7e8a8b56a912cef82b8a14013224b1127f231880b0014 +size 92585548 diff --git a/3b_layer0_mlp.up_proj_input_reasoning_representation.pth b/3b_layer0_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b6b83dfe981afaa9411e252a36cd0ce7eb6b7c15 --- /dev/null +++ b/3b_layer0_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ed4c7c68c1896efb7c2a79f17b11d7b908186df858e793bfd3090877e30c98 +size 92585469 diff --git a/3b_layer0_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer0_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5323a6e48b240f867194f5a3ff943411ac6ecfc --- /dev/null +++ b/3b_layer0_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d0f350eb70d5d709ddf82d4430713e0f6252be21c32a05080643384522735dd +size 92585563 diff --git a/3b_layer0_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer0_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bb641358b7be81105d40e32b042cd279dd9a122f --- /dev/null +++ b/3b_layer0_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c039231a4b36b209701521d2c254d46dd55241cfa157ecc61b5ade079acb8c27 +size 92585558 diff --git a/3b_layer0_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer0_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..df8847d9456d52db0af7ffbc7ec9727cc92da142 --- /dev/null +++ b/3b_layer0_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e242a2d8e784d8d3b5f773d5c76a300026fd44100fcad7f3b362897324de0ed +size 30862939 diff --git a/3b_layer10_mlp.down_proj_output_reasoning_representation.pth b/3b_layer10_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..23697a8ea8583ba760d5dfc486d25bca75f7ec9a --- /dev/null +++ b/3b_layer10_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbaa016dfc59afa00e10846e13773451acf36127a6bf7817de9d23655d301dd4 +size 92585553 diff --git a/3b_layer10_mlp.up_proj_input_reasoning_representation.pth b/3b_layer10_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3156dc7aa966c6ff55debae5c371e04158b7317 --- /dev/null +++ b/3b_layer10_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ea58e2b94fd5285efa9bba1d4fa829de9ca7edea7dff7f43da4b2eec8d4582 +size 92585474 diff --git a/3b_layer10_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer10_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..50aab749b14ed0bfd0a42d1c08d38d7c714b408e --- /dev/null +++ b/3b_layer10_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1a02e9d94843315a3f416a70f7d2b23856374ad7af0abb2b88da9822ab076f +size 30862944 diff --git a/3b_layer10_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer10_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d8b6f43c5cf6937ea0713533f94007f19ba632f --- /dev/null +++ b/3b_layer10_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88d67a41010eda64c8c192a6522ef3d2812d4abe8ed7f8c475430c23a1529c8c +size 92585563 diff --git a/3b_layer11_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer11_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..59117759c7ebdcdac08dcdb2da03ea7be73b0d0d --- /dev/null +++ b/3b_layer11_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f038f0b5744b7887f204f60b63e8529239b05942dada4ab5fa2d7ae42d54fc83 +size 92585548 diff --git a/3b_layer11_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer11_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4866ff8f9fcac1d336af20db1e1cda1137528aac --- /dev/null +++ b/3b_layer11_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb8777c6ef5d6975003b7c69cded198f867986293caaea4218d2d5d7bcc9252f +size 30862944 diff --git a/3b_layer11_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer11_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf84386c05bf2778a38add927a4db49ac1ab6ff5 --- /dev/null +++ b/3b_layer11_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9402a3923b762f80add3c5fabaa5743a2837037b388c9932ba6502f7b138162 +size 92585563 diff --git a/3b_layer11_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer11_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..202831e1435dbe4a676c6b63e55cfb12f88e4a66 --- /dev/null +++ b/3b_layer11_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baae69942a7a099b45cd45bd68d56263d57b0410e7fb64cb52c78897aa854942 +size 92585568 diff --git a/3b_layer11_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer11_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e284319d0e96f24b2b11dc008a0997b4b75b790 --- /dev/null +++ b/3b_layer11_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c7fc27ab57bf520d97f2e5f3a45ebfd1bcb93be7088e6a143579c32c188176b +size 92585563 diff --git a/3b_layer11_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer11_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2ed42936e84789ce4ced6c0053234611dbccbe75 --- /dev/null +++ b/3b_layer11_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb14c51095b5b4c04df0b796b9c8d5b5b443dc3545e820e75ec9c7cc7ff6e3b6 +size 30862944 diff --git a/3b_layer12_mlp.down_proj_input_reasoning_representation.pth b/3b_layer12_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1b2cf5328afb3e74086159dcd87754f16d479fd3 --- /dev/null +++ b/3b_layer12_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7fefbd4a581657696d0821ed7586fa3f42da2bd3d4f636c5edfd34aab086aad +size 246892108 diff --git a/3b_layer12_mlp.down_proj_output_reasoning_representation.pth b/3b_layer12_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ae51c43b2334216cc75544458048b9ae4e6d8498 --- /dev/null +++ b/3b_layer12_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a755f527b055fbf424658000c5d73679e9c6a1c57432845b322b94c6f607554b +size 92585553 diff --git a/3b_layer12_mlp.up_proj_input_reasoning_representation.pth b/3b_layer12_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0366c5f9c14c91f9dd582c0fef5c31272ca70539 --- /dev/null +++ b/3b_layer12_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d70ad18f4509775a5eb7211f2990d65bc00827d5ac5a05fbb63b0e3eb6e263a1 +size 92585474 diff --git a/3b_layer12_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer12_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..713bb227e0f6e5be37230697b73ce7457c7f2f12 --- /dev/null +++ b/3b_layer12_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75599b56ac3a9e7addffe0948bd70d74add10e6ba8c61c1dc5e358db38b9aef6 +size 92585568 diff --git a/3b_layer12_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer12_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..18250aed742c3c18404a9ba6773f820e9a9c2c06 --- /dev/null +++ b/3b_layer12_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae8683ac098e12a459fe2991c3495c5cd2f309bef7579e7d90afae1405d8bcf2 +size 92585568 diff --git a/3b_layer12_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer12_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5ba72be90d7e8ae6f653baa0a3119a1dc8005503 --- /dev/null +++ b/3b_layer12_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71bc90db722eff829fc0d68f1c43f6fcc23e6ac884b3327a91f10bf47171274 +size 30862944 diff --git a/3b_layer13_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer13_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..00024ee244c4388c1e109140119517065c438729 --- /dev/null +++ b/3b_layer13_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5712fa824e876ccd5b646f60da90bd60da8efee186624d161ed2884bcca47f3c +size 92585548 diff --git a/3b_layer13_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer13_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c3f9da594301caaffa4cdc1920f64da646c04982 --- /dev/null +++ b/3b_layer13_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8dffaf45863da0fdb1808631c9bd0bafc0fe161923672fef0ab60e961efc2d +size 92585563 diff --git a/3b_layer13_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer13_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..005a3db47ce9f04baaa1e7551898cd9fc0665ff8 --- /dev/null +++ b/3b_layer13_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7453086540d6e295ee6820726a97924e59ea6024aae1aa11ec3e5da080d9e45d +size 30862944 diff --git a/3b_layer13_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer13_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe83ff5c50247a7303ef97d73de5ebc0819da158 --- /dev/null +++ b/3b_layer13_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d717f874689b0dddf20d919e7383c99b68b6e44022507cce83f6fbf7d26f2cc +size 92585563 diff --git a/3b_layer13_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer13_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5436836649e4b10567c2d58568f14a051e0d1715 --- /dev/null +++ b/3b_layer13_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c4323803b7c9a1c49153c244bf4afaa832c40f6356a6f6e9b39fe37d4f9ab2 +size 92585563 diff --git a/3b_layer13_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer13_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9dfc9bfc7c0f564997f81fb3a34d9f5bcb74a8ae --- /dev/null +++ b/3b_layer13_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23961119efa2e7224c198e04f01604a4001118a22b9dc41dcc8a3c87eef58fca +size 92585563 diff --git a/3b_layer13_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer13_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..99c9e09f9f441eae0b9fc1d6b073df4807702795 --- /dev/null +++ b/3b_layer13_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ae8edeeade4df3d983f89ca0ce6b49a121e981b7b7f0391440469f4fbd12d5 +size 30862944 diff --git a/3b_layer14_mlp.down_proj_output_reasoning_representation.pth b/3b_layer14_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c34155f33a07329861b0ebe4e2e8513c78abc4b0 --- /dev/null +++ b/3b_layer14_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344f6f07fd8e4b4eca7f04155fc5b060fb36907d84879ccb853b1b75d32d6df0 +size 92585553 diff --git a/3b_layer14_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer14_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a52572c8a6b03c0ba3b8c16170177c0af31d144 --- /dev/null +++ b/3b_layer14_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5466ae22cb002b3d32f31e2bdb9c7c4e1243a7bb450928867838b24de3605f9d +size 92585548 diff --git a/3b_layer14_mlp.up_proj_input_reasoning_representation.pth b/3b_layer14_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c3356016178825f6ebaf547aabf760794b1a0911 --- /dev/null +++ b/3b_layer14_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464b6b9dee423609689707ed82eb80a246791eece066507e7718d843a629ef87 +size 92585474 diff --git a/3b_layer14_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer14_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..45f4a8cdda5db0247fa08eee66b04720516db01c --- /dev/null +++ b/3b_layer14_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f983ea5af855bef29c2029e31c5c9a38da491a99712d2e097eb1e456ead144f +size 92585563 diff --git a/3b_layer14_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer14_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0ecb66ccea4fa3b80db19b875f237e561fdf87a3 --- /dev/null +++ b/3b_layer14_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58411eb616fc3666778945ebd9300c4fa17595c5d0c49937d0d177c7f39f5685 +size 92585568 diff --git a/3b_layer14_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer14_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1a041ea67b8240a3aa5063a03f08d6a29e1b00fb --- /dev/null +++ b/3b_layer14_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97cf375bdb0afa94e392c881e4d0782a769933814a528081091ea06c11639ba5 +size 30862944 diff --git a/3b_layer15_mlp.down_proj_output_reasoning_representation.pth b/3b_layer15_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5ad1af84a71af96bb62dc9bbb6ca52fe27781631 --- /dev/null +++ b/3b_layer15_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:940248560b76e1c5efc1d59a470dc340f39adef799af54fc9b54b139ecd67ee1 +size 92585553 diff --git a/3b_layer15_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer15_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d98adc1def0391fc23326a09fcca30968e64f27 --- /dev/null +++ b/3b_layer15_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6209159fde9aacf557377b96fce10b296ff4085e32039a87a4ef214f7ca7db7d +size 92585563 diff --git a/3b_layer15_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer15_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..44e0c47440039a9f5fbbe65bda6d0b9e92bd0157 --- /dev/null +++ b/3b_layer15_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b0ea404f5ef55b271b0032f97915c1bef3497fb3306530606fb381d620b47fb +size 30862944 diff --git a/3b_layer15_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer15_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f6dc22fb3ec5513b0c5bb680f68b186359ba20d --- /dev/null +++ b/3b_layer15_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ddc210d1fd1ad0f339e3e9797d672e04f94e9b03441c603a002de6a7a5a0c7 +size 92585568 diff --git a/3b_layer15_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer15_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd38a9582fcfa60d6838dc8bf8de874db5b6992a --- /dev/null +++ b/3b_layer15_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d32c4d3f5a3af52262b9323d27040317fa8e075ae955f0fde094f98f8a6da5 +size 92585563 diff --git a/3b_layer15_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer15_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0dd539c0ef07e3355394f66fd20d8db7202301c4 --- /dev/null +++ b/3b_layer15_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545086911925d5184d0865bfbc0d15d63c3f0298baecbebef7100ac264b182a6 +size 92585568 diff --git a/3b_layer16_mlp.down_proj_output_reasoning_representation.pth b/3b_layer16_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0988b91535b100079cce1603bafe7873da055b76 --- /dev/null +++ b/3b_layer16_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76b863fbc81521f2d63df988848da78b1884d817819f6651e3949feeeb7ec4a9 +size 92585553 diff --git a/3b_layer16_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer16_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fac73466bdb456068145e64bc372d30ab51e7e05 --- /dev/null +++ b/3b_layer16_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b38e05f89210fd3a99be45bad4f5b522959eb5eed69419cf0f8a7a1ce2b02ec8 +size 92585563 diff --git a/3b_layer16_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer16_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b5d965f876ec3ce225279be100ceab7cae8fc234 --- /dev/null +++ b/3b_layer16_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c68549df32433e162e6895d07f812bb894539a457cadcd7abe028337f959559 +size 92585568 diff --git a/3b_layer16_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer16_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6156193d280d038bfb406796ebe1b4c94f7de50 --- /dev/null +++ b/3b_layer16_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02abdfbc97ed0efb1636412098d41f8d3523efed1a6b7405e7145c456fb959c0 +size 30862944 diff --git a/3b_layer17_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer17_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f467c4ba8b4655a8320ae44d5722582070718c14 --- /dev/null +++ b/3b_layer17_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ded45ed3118eba4b0446f3073fbb8babf4baab684fbcb6b38c3d7fe3b0f5beca +size 92585563 diff --git a/3b_layer17_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer17_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..497f9a9dfbbed33eb1d2f36dbf6fc2f88b9a21d2 --- /dev/null +++ b/3b_layer17_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08386fe4e3a86de5068b2e050014a3fd0a143a286c323806ccd75068f006247e +size 92585563 diff --git a/3b_layer17_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer17_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a1e1faec081bb23dde246d5c9c9186e67edc8a66 --- /dev/null +++ b/3b_layer17_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e426177d118d7743c6211d7a8abad4bc9033556dab922e822e7a40da56a9042 +size 30862944 diff --git a/3b_layer18_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer18_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3d3c5c483a2daf485641e10d87d0a1bac92441e2 --- /dev/null +++ b/3b_layer18_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d9ce65d3397cf5f8c79dba2fe2bdaecb77255f6a59678beb25d5f4cf26a81c +size 92585548 diff --git a/3b_layer18_mlp.up_proj_input_reasoning_representation.pth b/3b_layer18_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdbafd5de850cef62757fd739e05aada888383c6 --- /dev/null +++ b/3b_layer18_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26ae5dd56682c95402a53d68a5caf46eaf7e4beb5428603bb635fefed1cb019 +size 92585474 diff --git a/3b_layer18_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer18_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1fbc61bcd171df165742a9ddfc526016f102beba --- /dev/null +++ b/3b_layer18_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad177504107834f8e7fcbd9be11b0597fae189bdee63c379426e2344968c82a7 +size 30862944 diff --git a/3b_layer18_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer18_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..41932ca0f0f41ed2a9ff9570b6ffdcdd7cc6c9e6 --- /dev/null +++ b/3b_layer18_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b54446484106285d9acd82516fe6d43c362af51a8efdc4f7e4cb8b028528a207 +size 92585563 diff --git a/3b_layer18_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer18_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f436a74af82cd708d48bee7038150e386cd22eba --- /dev/null +++ b/3b_layer18_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443fee48be443b8f0724600691b378732257e669b399b23ccd8e36cc3853ce9c +size 92585568 diff --git a/3b_layer19_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer19_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..959a9dee58b35a595dc9ffaaae5289218ffadff5 --- /dev/null +++ b/3b_layer19_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71ddd57bf46cf9417cf9987b0802447427b1324c2030071aee73cd6959996bb6 +size 92585548 diff --git a/3b_layer19_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer19_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1f1773f54891a1ddb1af48aa0e1728d3051a6097 --- /dev/null +++ b/3b_layer19_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a216cc443d7d87c8d2f177858074b502d79d2b3f27772d588ee2ee25a968bf88 +size 30862944 diff --git a/3b_layer19_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer19_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..10ea496132b7ac6b8ed6696bf6eabaa1ae8ebaa0 --- /dev/null +++ b/3b_layer19_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:052c375b2768a7157928d7734444460f4254fbd1b959d6176e973baa49736db3 +size 92585568 diff --git a/3b_layer19_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer19_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4b598af69713424fae2ef348840630b848ef979 --- /dev/null +++ b/3b_layer19_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735f499f0ee1acbe0e5498ac91544ad24400fde23225c4f0f60b7501271d2baa +size 92585563 diff --git a/3b_layer19_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer19_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..17971cb3642acc1ab1101792536ffa9c247523b7 --- /dev/null +++ b/3b_layer19_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e33cb7bd528dd64edda24a0ecc1a9ac7b24b4ad6a6c124f4718cd383ab13b87 +size 92585568 diff --git a/3b_layer19_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer19_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b63bdc7ea69ae80f673394cb0800992c07cf5e53 --- /dev/null +++ b/3b_layer19_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0ab26f753439c105187c39a4e37a97b49a387a5e8d44bea13638afaf5c73678 +size 92585563 diff --git a/3b_layer19_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer19_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ba163a63ef8f278b312ee22cca031af64ae64161 --- /dev/null +++ b/3b_layer19_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4cf73f1bbdacb788af07ec90edf198803a0cf9df86a5e4073fcabd4cb747377 +size 30862944 diff --git a/3b_layer1_mlp.down_proj_output_reasoning_representation.pth b/3b_layer1_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ac48db80259f69c3e5968f911cad4ee2ff06c9e --- /dev/null +++ b/3b_layer1_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c283f6542cff6e6fba706c975357d73c1c2f6c92c13058639d9ae050a57230f7 +size 92585548 diff --git a/3b_layer1_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer1_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f02017a5c284594acf1016efd77e301c389d216b --- /dev/null +++ b/3b_layer1_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556fe05fb26fe3844b8f1f0592f9be1a4f0bf08964cccab03957bf7b37a4ae85 +size 30862939 diff --git a/3b_layer1_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer1_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a9f1dc33bb7391744ab0de53541b53541be0ff6d --- /dev/null +++ b/3b_layer1_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89c1993fa50970eeeed53afc29f0c7b96f5844ba642ef5d8471aa93f7aefd09 +size 92585563 diff --git a/3b_layer1_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer1_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb529808a5d014fe7b7d115bfe5a863686509cf1 --- /dev/null +++ b/3b_layer1_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac30ad264c73498020bbb581371f223f674074a3884149dd435bb46c63e068c +size 92585558 diff --git a/3b_layer1_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer1_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..15c0b91157c347f3c02fee6d812c767c37a83809 --- /dev/null +++ b/3b_layer1_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c1143d39c1361699ad42bbeff810fc61c5d1f4fa1e95815505eb545ac63676d +size 30862939 diff --git a/3b_layer20_mlp.down_proj_output_reasoning_representation.pth b/3b_layer20_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5897ccd90b275831f35bc2013219b84d7843fa2 --- /dev/null +++ b/3b_layer20_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed98c7ac7b8f1e528615c6d5eebba096a38364adb6e8037863e4c27d8045ae34 +size 92585553 diff --git a/3b_layer20_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer20_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6ae152af1bd0054fc668becb0172134cd305f51f --- /dev/null +++ b/3b_layer20_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0600608da4659add1bb827a895179b446a9e49f7b9b7a904f901c468b08c4a42 +size 92585548 diff --git a/3b_layer20_mlp.up_proj_input_reasoning_representation.pth b/3b_layer20_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3966ffab4e20f6f41d6862cbc85c1dc96a19f52 --- /dev/null +++ b/3b_layer20_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619d592c3dd72c30cc4a907660ae02c26038d8756096da5d3fc0bb84891f7f7a +size 92585474 diff --git a/3b_layer20_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer20_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7d5e6b0b9dba7f849ace5b552341391bec8862c --- /dev/null +++ b/3b_layer20_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15b677f862be89a68482195496ead9b91547339d3e46f58c8f99813e30016e3d +size 92585568 diff --git a/3b_layer20_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer20_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b86a111e36e3d8872764cd5c17745ec8ecc35069 --- /dev/null +++ b/3b_layer20_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dba8d4c3fd39c37433674e408242a1d1e62ef2d2ab08ba63f6c2d4a4d986a6d +size 92585563 diff --git a/3b_layer20_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer20_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..05ce67d51dfe88a1eaccff7738ae8991d5dbc256 --- /dev/null +++ b/3b_layer20_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e46c07b4c525301eb5587fdc939ac8207fc48e74a9840e3c51a9f13f4731f3 +size 92585563 diff --git a/3b_layer20_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer20_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..abc2ea3b397b7106c48deb0c472259761686243c --- /dev/null +++ b/3b_layer20_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9726339f506f7592c5256677b3351526ed1e37c7a944bd212d59617e389f6c48 +size 30862944 diff --git a/3b_layer21_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer21_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f9d06e55f336cd91281880d65d83617a31c3cea --- /dev/null +++ b/3b_layer21_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef273d9d2098a36f0b9900f82e384a169d9da773351c08376f643cc6e6bed1a +size 92585563 diff --git a/3b_layer21_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer21_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..752ebe57db483d2bf5c2b557fbd5048f46f4d1b9 --- /dev/null +++ b/3b_layer21_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae766f7f83dbbbf1e00b48d2f91ccf687094d47e3eff957f2663f2e9be4fd2d9 +size 30862944 diff --git a/3b_layer21_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer21_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa1a05d12d4f56292aa880a19f8c23ac0b6da3ed --- /dev/null +++ b/3b_layer21_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18654d048f840ef3d4a0aa9944042fbbb56b5e273e97d13b04ce502a779835d9 +size 92585568 diff --git a/3b_layer22_mlp.down_proj_output_reasoning_representation.pth b/3b_layer22_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bbd4b1d4c7fe3d5e3fcb95b75953b9bb27f1c8ed --- /dev/null +++ b/3b_layer22_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e4e06a1177d2e6cd7eae45f3f751f7d62e67ec2ca96de898794a845d4e81cb +size 92585553 diff --git a/3b_layer22_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer22_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ebbbebbba54edf8e702dccb784a02994bf89919 --- /dev/null +++ b/3b_layer22_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0217be2221e1473c437bb6572888560d6356c62e059079f123c152f23978b3 +size 92585563 diff --git a/3b_layer22_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer22_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..26d7ebb70c24b3be5927a6bb7730f26e24091e96 --- /dev/null +++ b/3b_layer22_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5330b593d9d632f3f6d1e8efa948a49617b9191dcfdee14e5363daa453513e52 +size 92585563 diff --git a/3b_layer22_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer22_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..087f01088d05f3d6ed52d1d6d502662d4d662e4e --- /dev/null +++ b/3b_layer22_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ce7fbeb8a6dd9074f79909d05e55a33dc2ff7f85df8a2684b7081a2fbf81b0 +size 92585563 diff --git a/3b_layer22_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer22_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5b8758e30bd52e0fee6a1ce62030bf091aaa72fe --- /dev/null +++ b/3b_layer22_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ed8181899e1a889e7f5232446622fa7b34c41a08ccf5f302e56b2d99f43217 +size 30862944 diff --git a/3b_layer23_mlp.down_proj_output_reasoning_representation.pth b/3b_layer23_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a8405467a1c20576474d99b7f4dc50b7406fd281 --- /dev/null +++ b/3b_layer23_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9257e3ef9ef090e11334066a4f98440c26891e3b50c5b4f68c83ce01d5c68375 +size 92585553 diff --git a/3b_layer23_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer23_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..533c3237f3336f2d4dfe161b0009d72036c51428 --- /dev/null +++ b/3b_layer23_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d1c133a74177d547e405d8341d87abdb1d265ea2d26da57e5ecd6f0f69a1297 +size 92585548 diff --git a/3b_layer23_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer23_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4fa1fbd7b656149ed8da338c986177718f7c4b73 --- /dev/null +++ b/3b_layer23_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:649918977b54d3bf45fb98ce1fb772d7cd9eedeaeb6634ea0b8e2285164ca4d3 +size 92585563 diff --git a/3b_layer23_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer23_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..475c39db06579d1e37c3a2aaaf2111c946d76297 --- /dev/null +++ b/3b_layer23_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b300a253627c9af4a2ebb1d98b6828ad4f7ab0732054df2baf52d433efe6f6d4 +size 30862944 diff --git a/3b_layer23_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer23_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a82875c537d1ba1b46d23436bc6192c7f186bb0 --- /dev/null +++ b/3b_layer23_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16c6cbc675320f0b91b2eb163a350e3d4fbb791e171e945449fd351474c04a7 +size 92585563 diff --git a/3b_layer23_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer23_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8230e75d4f4dafb2ff1688ee97da02d3f03338fe --- /dev/null +++ b/3b_layer23_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:727bfc441106628083cfdd1c981bfbdcf89347c27837c2fdca5b83f729502c59 +size 92585568 diff --git a/3b_layer23_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer23_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..47c2580496454981d0651d354c7563012e729007 --- /dev/null +++ b/3b_layer23_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934bfa4d420068a57e52ad2d586ae51404248ca37ae28609ffce89522182c5bd +size 30862944 diff --git a/3b_layer24_mlp.down_proj_output_reasoning_representation.pth b/3b_layer24_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..da32f4e98f967118ba895465e17ee558ff1d371a --- /dev/null +++ b/3b_layer24_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75da73d11b595583ed6ce7d4aa0a82091536060b3def843d3f3a63e8b89a6cc7 +size 92585553 diff --git a/3b_layer24_mlp.up_proj_input_reasoning_representation.pth b/3b_layer24_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5ac6cdf17f23074f8c5900437d2dd10c6650ba5 --- /dev/null +++ b/3b_layer24_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26b433b7c6f52349a80e4928193b6c021fa96a1f7f38c86b3e69dd8876dc655 +size 92585474 diff --git a/3b_layer24_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer24_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..80c514fabeec5268c88673d1996bc24c5b54a66b --- /dev/null +++ b/3b_layer24_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37f4f7fe7e7079f074f410aedb10d6e967feb19ce8af21df14f1b1dee4782d0 +size 30862944 diff --git a/3b_layer24_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer24_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc76888d68d39a0d5a874f64dbd1eb02e6a89e35 --- /dev/null +++ b/3b_layer24_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d6699e91c0cded49aa690fa3bd1a5640c3f63c12f1a843932fc4d57d0dcb98 +size 92585563 diff --git a/3b_layer24_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer24_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..994de23f7b6694092a2354cf319ece963b9072e3 --- /dev/null +++ b/3b_layer24_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac7ca954633dc93646e89875726ff7fbac99701a60306b0e70f680c33eafb3f4 +size 92585563 diff --git a/3b_layer24_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer24_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a47572ef4313b2fdcee7abedd1dda9f9933bc05 --- /dev/null +++ b/3b_layer24_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bafa7b40591207548464ccc5eab615392e14033676dcdab953fe9e55afcb2ee7 +size 92585563 diff --git a/3b_layer25_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer25_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..42b04d0d52c0425e86ff3f3dd7be38e235902b83 --- /dev/null +++ b/3b_layer25_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fee062c827adb7e70c409b508f36521860df860dd7c6dde20636c47db06a4fa +size 92585548 diff --git a/3b_layer25_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer25_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe7e331d1ab39355c67c89a4c070eb2be1db3c9b --- /dev/null +++ b/3b_layer25_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d77a7ca4fa87de78c3580efc216a2f397ffab99c51396190d9b22f3604043d +size 92585563 diff --git a/3b_layer25_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer25_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c95ea1b5ff068ad02bec4ea9130a505f67ad538d --- /dev/null +++ b/3b_layer25_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6eff982f22e218fadbe51df45285af60a64c892ca90f98731df2c1842b32f76 +size 30862944 diff --git a/3b_layer25_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer25_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..eefc240738b183ffbeb01222c61bee587983a2f4 --- /dev/null +++ b/3b_layer25_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5c266d9f4a3361e2a22915308f2ca92bf988233a726172a9f4725484cb7e6b +size 92585563 diff --git a/3b_layer25_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer25_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e81cfb7d9c1dbe410ad60d159621614915292452 --- /dev/null +++ b/3b_layer25_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c38e427862d43a904de73a895f8f96a8eea00077c86e607c3354abe8fa2d6fa3 +size 92585568 diff --git a/3b_layer25_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer25_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd766c943f5e76a6d0586236a3e89894c74f7516 --- /dev/null +++ b/3b_layer25_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a590391d438420adc35aa286efb529624857da0ebda2b74494908cb7b160dc6f +size 92585563 diff --git a/3b_layer25_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer25_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..57afe208bb589028abb382e45c22474263ad3f84 --- /dev/null +++ b/3b_layer25_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ec87c6aef50df46d5d5acc76f962d88a85ab4c57e27ceac31a1b785e66dc89 +size 30862944 diff --git a/3b_layer26_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer26_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5c0b7203ad33accd67b16f932cb2f5ce19792c61 --- /dev/null +++ b/3b_layer26_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d51edfbeddd1b5a1ee40b25a8aa52cb3fda8c3e020485be5c201f73845de08dd +size 30862944 diff --git a/3b_layer26_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer26_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..561beecc3f5ce8715f4596d21c8a8ac2ab3d03bb --- /dev/null +++ b/3b_layer26_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36ae5d867174945da9615626934eeef58ff9b535454cdea0a2222ce08cb7c35e +size 92585563 diff --git a/3b_layer26_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer26_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e071f9db6659b86b430a73158e17068636f0a9ed --- /dev/null +++ b/3b_layer26_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b973fd89c619c87c2357a0937e9493919cc963161cd21075fdc5879f7eaef73f +size 92585563 diff --git a/3b_layer27_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer27_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac79672374c826808eac333cbfcac79c3fbb89dd --- /dev/null +++ b/3b_layer27_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc2d414e609229443821aaacdde7cc15649dd589ef2ede2ae709e09a0a58cf4 +size 92585548 diff --git a/3b_layer27_mlp.up_proj_input_reasoning_representation.pth b/3b_layer27_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d8ab9bf270a5f54619b7ce98dff794b2ec27f539 --- /dev/null +++ b/3b_layer27_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc8f66756e8c8bc8b4f94250fd40869c83e49abd338062e81a7f9955e8bf98e +size 92585474 diff --git a/3b_layer27_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer27_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f51f4d1ec1c478b6d727100d9c9e635502cff1c0 --- /dev/null +++ b/3b_layer27_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59b32e064dbbf5117420bdb2d9f8ddc2663b78e0ede6edb1a70e33b0f08251f3 +size 92585563 diff --git a/3b_layer27_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer27_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..be067ff6c24467304829946c88ffe3647b6ea9b9 --- /dev/null +++ b/3b_layer27_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af4e8ebbad31c00203d3e0263e32e10f54327cb1b4b5b695543b824d896e241 +size 92585568 diff --git a/3b_layer2_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer2_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..70cd67c95bb35fa82b2c09fae1758a7e30e8e92b --- /dev/null +++ b/3b_layer2_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313f702664d452d59999054c565e0615699d0706e9fc7958be1bbc83811df276 +size 92585543 diff --git a/3b_layer2_mlp.up_proj_input_reasoning_representation.pth b/3b_layer2_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8e7c7dec434200122bb0fef684c1741d5d6c08ee --- /dev/null +++ b/3b_layer2_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1f0dc528441d3c8f8a14e46d832fb685c5e4f6bd205b5032133d5285fb41412 +size 92585469 diff --git a/3b_layer2_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer2_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f15157924320db49d6480d9190934bfb4849c0dd --- /dev/null +++ b/3b_layer2_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5311ab951677a2d98f0f5b2954cc3171691f113f6c1ecb31608276f5fd81ed87 +size 92585563 diff --git a/3b_layer3_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer3_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..173bad2e2e5d9cecf1bb3b3bb21809ebf749416b --- /dev/null +++ b/3b_layer3_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09afb0056034e7bc01302ee1ffb348f93453a90c6d5e3108fe831a288e24662a +size 92585543 diff --git a/3b_layer3_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer3_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..21227b79b529baa3ca845aa24ef9c8a0d59da08e --- /dev/null +++ b/3b_layer3_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0b7d4b5100d7bfc028ebcad1e4f79140de166519ac5f7a1e810b58dac825c2d +size 92585558 diff --git a/3b_layer3_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer3_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9cb9eaab786006e728cdb5b893f9819a0e30da3b --- /dev/null +++ b/3b_layer3_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e866bb79c7b22759411f8d8a4d344fee19e84cb96fd5a97abbbafaf0a0648fc +size 92585558 diff --git a/3b_layer3_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer3_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7b87fa88e875faffff48748ea3436469660b971 --- /dev/null +++ b/3b_layer3_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1ba73f941f1ae7ff7cad768a476e7ee4b550366a19fb0fbb131e607f8a6ee2 +size 30862939 diff --git a/3b_layer4_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer4_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fecd2d55cf4f94e6167ff8f6b09eeaf19428f6a9 --- /dev/null +++ b/3b_layer4_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6671bb982c8194a256d49d930a57aa86a2e4bd26beb091ef79a9fae115f6a9b8 +size 246892108 diff --git a/3b_layer4_mlp.up_proj_input_reasoning_representation.pth b/3b_layer4_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..da3adb66d10471e10c98660b7a4d7e37412e3134 --- /dev/null +++ b/3b_layer4_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86b18b64a0c1cd668fff25bab8b41c69c5281477bd4eb66f63818fd9a412045 +size 92585469 diff --git a/3b_layer4_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer4_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..477b48d15d4a31584d86d0482179103671e9e23b --- /dev/null +++ b/3b_layer4_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a7e9f646d4753e13f740e18f6e36ab4feba5ebbb760999baeb18d6f0b2477eb +size 92585558 diff --git a/3b_layer4_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer4_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b791757055e919a3fd6a3297e1bb45a0409007c9 --- /dev/null +++ b/3b_layer4_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8754997e0add3d9ecd4fcad0934adb79be627bc161df73317ab74f4a60dc2212 +size 30862939 diff --git a/3b_layer4_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer4_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..dba6e10adc18d71df42d602e560f24c991ff048c --- /dev/null +++ b/3b_layer4_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a409d9778bbfd0d547c6064bd670b81e756e587f8e0bb080b43ef9ff7ab1798e +size 92585563 diff --git a/3b_layer4_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer4_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2ac6b6b8ca2a648fbad5a4d503e221944a5e7108 --- /dev/null +++ b/3b_layer4_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6b75e699221a64006a291249cc5a3801e13ef2c0b4095f531cf1be1adddf83 +size 92585563 diff --git a/3b_layer4_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer4_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6b6d2971c2c1e703e320ff9304f8f856e0d5e4cd --- /dev/null +++ b/3b_layer4_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8338b7de807e95489a9a4d218e839f932b1cd2379360fdc1d1cbf5b87a63c05 +size 30862939 diff --git a/3b_layer5_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer5_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..07311ebf7f362cbdd55f8bad0178aa2b3b74f5c3 --- /dev/null +++ b/3b_layer5_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55faedb8f1e18747b802eaec6f431a32aaa6da357ea36ed468479e21e9e523cc +size 30862939 diff --git a/3b_layer5_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer5_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bf42ed8bb213020f939fab631a736ec8752ada69 --- /dev/null +++ b/3b_layer5_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1130a4c36f7c2ca616f0c6611b249d0c3d6ea2b9a536f84c792fe15ebc186cd7 +size 92585563 diff --git a/3b_layer5_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer5_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d4449c078627acbca0ae3f701bc8363f15b88e4 --- /dev/null +++ b/3b_layer5_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e595701c11ed561f75c91696647fa3fa51d2945da63daead7f2a04bb7cec538 +size 92585558 diff --git a/3b_layer5_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer5_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e97d9d7f8127067747ce43dec536e2084b212992 --- /dev/null +++ b/3b_layer5_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c8fe8dbcccb32aa772e7dfa0669a6e8c2276c3cc35d17783b65ce7d91d3158 +size 92585563 diff --git a/3b_layer5_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer5_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c344b6f06538842a9dbc353a847c152fd00392ae --- /dev/null +++ b/3b_layer5_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c76c679c3741206102ce9e404a9324fce89f5343efda9cbce0632bbc92044d +size 30862939 diff --git a/3b_layer6_mlp.down_proj_output_reasoning_representation.pth b/3b_layer6_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..badf3922360b3026a696f27327de41b98fa233d3 --- /dev/null +++ b/3b_layer6_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:697a947ff8df103e647f254a79a14e81d80612066a7fe2646a128f8922716b40 +size 92585548 diff --git a/3b_layer6_mlp.up_proj_input_reasoning_representation.pth b/3b_layer6_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d615490625cbe7ebf2f483455c9ee695712c10c9 --- /dev/null +++ b/3b_layer6_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:213e1e1bebfcb442161db60c7e293ef6a77ea5f6c253448067d8f831a4c13a59 +size 92585469 diff --git a/3b_layer6_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer6_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8d5bb0db6605570e141cc0f7a4fa0b77f68829c9 --- /dev/null +++ b/3b_layer6_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2fe64246bb138d31eff3da5cc0c7d2bd284490d0460935e77b6cd919d7da02a +size 92585563 diff --git a/3b_layer6_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer6_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..80be1c7e49578b6998fe27f4dfd23f049a7b90dc --- /dev/null +++ b/3b_layer6_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1600edf3d81f96cbcb280dfe1a675abba006b1569dcf7876b02e0aa6049d1530 +size 92585558 diff --git a/3b_layer6_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer6_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..487320318ab42fff95261cecbc3215a6ca7d5231 --- /dev/null +++ b/3b_layer6_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ba569172ef577a4eff236aebd24b334053b4e5e8c8deb95242c17a1040d674 +size 92585563 diff --git a/3b_layer6_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer6_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..06bf5e64e48c58ee59ced55833e52b90fb3f345f --- /dev/null +++ b/3b_layer6_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0950a5a55555087674d8d824da1b59ca5ed0050306a45309780c2451604fc681 +size 92585558 diff --git a/3b_layer7_mlp.down_proj_output_reasoning_representation.pth b/3b_layer7_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4faeacb947855daa0ff83b35873d5cff90a1f5e9 --- /dev/null +++ b/3b_layer7_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a477b4fe8cb8f860722a4915511347056d0d33a26f99a5646b8ba52592bfd9 +size 92585548 diff --git a/3b_layer7_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer7_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7726f8229d0d9ceace91150e7aff3f0812905376 --- /dev/null +++ b/3b_layer7_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b6a74fb378c5be765424aa0ce428a535f538cb70a8dcec47a0bbec33a0ba966 +size 92585543 diff --git a/3b_layer7_mlp.up_proj_output_reasoning_representation.pth b/3b_layer7_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a0318dda967004a4d64ae503dd7f7b24cf7b6e8f --- /dev/null +++ b/3b_layer7_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dad3d60ab0c8ddc83a7f1a16b5658c090f5b537000342ba32da603f4c16c7a0 +size 246892034 diff --git a/3b_layer7_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer7_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..95acee6846c51629872e2a7221228a36568aa1c2 --- /dev/null +++ b/3b_layer7_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b8b9feb40b94fe847a9da55572beac2fe656c7964aef720133ef9fa03f293b +size 92585558 diff --git a/3b_layer7_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer7_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3551aac41f9d8e5c43585d2953610f7f8b653e22 --- /dev/null +++ b/3b_layer7_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db2c811de132156ada5b59dd3fcd2b7f6d3434f0ea2f5f9451b994ad6d18aa88 +size 92585558 diff --git a/3b_layer7_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer7_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea0d2231d042edca098f4c843e68cc27cacae0a3 --- /dev/null +++ b/3b_layer7_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef0a52ab8f84162682bcfd238b6b6bdd1fc3d579ae83a90afad552f3a206df8 +size 30862939 diff --git a/3b_layer8_mlp.down_proj_output_reasoning_representation.pth b/3b_layer8_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bd40817c93ff987a9285852740647857b5b23c2e --- /dev/null +++ b/3b_layer8_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d2cdde93a13fe7c1a500e096833bb86b9bf71f0f6abe1ab93d58b44f218150d +size 92585548 diff --git a/3b_layer8_mlp.up_proj_input_reasoning_representation.pth b/3b_layer8_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..84d978a5412457f0d8164030149e96a8f2866413 --- /dev/null +++ b/3b_layer8_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34897ee34fd8fa17404fd101241a58747d4cd610a163f6fb2e577740202ffd5f +size 92585469 diff --git a/3b_layer8_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer8_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..0a0f9922f814c1df2b3ad393b620c889c86f076c --- /dev/null +++ b/3b_layer8_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e11460ddacf4351dc391ec897f381260e23ec3f6d1a4e7a3ae804dc9abc988a +size 92585558 diff --git a/3b_layer8_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer8_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d81744e8ca6a0523e896f80f3f23b4bd2c09a0ea --- /dev/null +++ b/3b_layer8_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e5541b859d843ad60cf12496136e5c422c531ab1456e14551bc56ab8c07e181 +size 30862939 diff --git a/3b_layer8_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer8_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1280fed779aadc746accab2123c890d87d770328 --- /dev/null +++ b/3b_layer8_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:490076b789f828e8691228f2f7606afcdd0775b97dd174c807e2ed9181bdebce +size 92585563 diff --git a/3b_layer9_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer9_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd5c83ecc7acf3d6165fd646e83fc6ac652b81d2 --- /dev/null +++ b/3b_layer9_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:152ac28e07dbfcc63da6b4c553668bd9bb19d4311255cb438e74304b14c2df16 +size 92585543 diff --git a/3b_layer9_mlp.up_proj_input_reasoning_representation.pth b/3b_layer9_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..588532ce5d6ce8fb4accdb6bcceed755f5f91924 --- /dev/null +++ b/3b_layer9_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21a97bcc2e7d3e28c1bab4b67d6f2b56f96fa4ad9944c46cf8906b09217c55a +size 92585469 diff --git a/3b_layer9_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer9_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f6ff17b080c7f7ecc9c68bb0cd5cd5c8824bc633 --- /dev/null +++ b/3b_layer9_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721fd0d3b0c332a6ac25635d655b9238e3b8282ab7830cc8459726b1f629c899 +size 92585558 diff --git a/3b_layer9_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer9_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a92ba4ad050220cd42b03d6a62d9c5167ba14ab8 --- /dev/null +++ b/3b_layer9_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88d7f1646245ddaa800618082e4551d644031e9706fd33e1c2656c9dacf8b6bd +size 30862939 diff --git a/3b_layer9_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer9_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a95e9501daa2a68a9636bb375b96f4f176c23731 --- /dev/null +++ b/3b_layer9_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecea5dc6964d7bf8f006cb9100075bf5cf71dda7fd651fda735f7ddaee803cd2 +size 92585558 diff --git a/3b_layer9_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer9_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..23a62ac88124427ca3b7d70d31603acd9aed2239 --- /dev/null +++ b/3b_layer9_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45ab5e4419985136c492478c82671fb716d752adf659dc87aaf635acb47256c0 +size 92585563 diff --git a/3b_layer9_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer9_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f4984c060a169c4006d4c3c24f30374eb98dfc4 --- /dev/null +++ b/3b_layer9_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4544e4d3eaa8632573548e295ea260e32c8f38e20590913609543ce3b2e42746 +size 92585558 diff --git a/3b_layer9_self_attn.v_proj_output_reasoning_representation.pth b/3b_layer9_self_attn.v_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7350b8322884142549f454255a2cfca7d745321c --- /dev/null +++ b/3b_layer9_self_attn.v_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1faff9141f3d795a9005cf1e7c887a645a47c1fc3dff24e3f08357fa6a2c795 +size 30862939