diff --git a/attn_out_all/layer_0_width_16k_l0_small/params.safetensors b/attn_out_all/layer_0_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dded89e46766886daf1b194301d6bf9b78ce57bc --- /dev/null +++ b/attn_out_all/layer_0_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1cdd8a1978f80c435593185bb6a1a684b2b92cf4f07ffd30cfd6d6f7a8dd9f6 +size 537018752 diff --git a/attn_out_all/layer_0_width_262k_l0_big/params.safetensors b/attn_out_all/layer_0_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..469705bac6a5b8f42cad7b5fc1daa9b6f5c1c50f --- /dev/null +++ b/attn_out_all/layer_0_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb5bf2ede2b0339dc0676b51098cfdf9ad73c69b5d9d3bdba18861a0a78a78e +size 8592048520 diff --git a/attn_out_all/layer_0_width_262k_l0_small/params.safetensors b/attn_out_all/layer_0_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..98841c96024e0f1df04c60e632c641045d789c36 --- /dev/null +++ b/attn_out_all/layer_0_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:508160e5228665c3f33c8edc21dc5601057d4cd2b5665caf9b81f8020cc8b698 +size 8592048520 diff --git a/attn_out_all/layer_11_width_16k_l0_small/params.safetensors b/attn_out_all/layer_11_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..adec64ee166ae0ab9b384c0a48b99887e5e1d2b1 --- /dev/null +++ b/attn_out_all/layer_11_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10f20da0742c95978538dfeb50e456d0c8e8ac4a2929c45dedf3beb60bbdc41 +size 537018752 diff --git a/attn_out_all/layer_11_width_262k_l0_small/params.safetensors b/attn_out_all/layer_11_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9748639b97659fed6b8b24afb99b54c32a3f12fc --- /dev/null +++ b/attn_out_all/layer_11_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c9780242f055238a5b05db5de8d3692217bb902535d51605e0e596bd49abdb +size 8592048520 diff --git a/attn_out_all/layer_12_width_16k_l0_big/params.safetensors b/attn_out_all/layer_12_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..59a141be5ce7fe6dd9ca743a683dbdaef0727232 --- /dev/null +++ b/attn_out_all/layer_12_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d74833b8be78a67ff0fece44b3ad203780fcd40ff8020a190b14fbffaab7ded +size 537018752 diff --git a/attn_out_all/layer_13_width_16k_l0_big/params.safetensors b/attn_out_all/layer_13_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b60db7f6b113091083bfc50b140faab5c03a04d8 --- /dev/null +++ b/attn_out_all/layer_13_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90f23372c373e83a8fb84ccd18026b84f543f89f8700880d83b879218ab91a3e +size 537018752 diff --git a/attn_out_all/layer_13_width_16k_l0_small/params.safetensors b/attn_out_all/layer_13_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b885a15d5eed14648bd64d544c862181aef7453a --- /dev/null +++ b/attn_out_all/layer_13_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d27ba05072021d7dcf64b4a77d5125dde511b5f6c9da775e7de05d5e10c6066 +size 537018752 diff --git a/attn_out_all/layer_13_width_262k_l0_small/params.safetensors b/attn_out_all/layer_13_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..38056e802e8310c64a8a0d716642f11ce511d426 --- /dev/null +++ b/attn_out_all/layer_13_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e15c16f5f97caeebe52515eea9352e3c79cbfe5a9fd3e18875790e6ecdfab348 +size 8592048520 diff --git a/attn_out_all/layer_14_width_16k_l0_big/params.safetensors b/attn_out_all/layer_14_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..226bdec30ac6584260ed51ea0168c76f3a3235a7 --- /dev/null +++ b/attn_out_all/layer_14_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9ff8c30a34fea80e0bba8447cad56935c4f46d01fa506600ed549625fc31bc0 +size 537018752 diff --git a/attn_out_all/layer_14_width_16k_l0_small/params.safetensors b/attn_out_all/layer_14_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..56f8eee5ee6d2e6c2ae054096c493ad52e234e65 --- /dev/null +++ b/attn_out_all/layer_14_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8db77ae72f998111fcb6a0c0984a480dec30f2b859d0a8b881658db267fd82 +size 537018752 diff --git a/attn_out_all/layer_15_width_16k_l0_big/params.safetensors b/attn_out_all/layer_15_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6fdabbc9bc061e850445366c8e9f6655d2aab6b --- /dev/null +++ b/attn_out_all/layer_15_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e8b116239e9daad2c0a080a13d9240dc90e1c149bf7ea3bef04d5402a9bbdb3 +size 537018752 diff --git a/attn_out_all/layer_15_width_16k_l0_small/params.safetensors b/attn_out_all/layer_15_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1268e2820163a3d1383d6c6227bf46095a10d510 --- /dev/null +++ b/attn_out_all/layer_15_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313133cf3ea9699c985bfad31d6e50b5582c3ef39a4b5cd58a1f9064e5c70c8a +size 537018752 diff --git a/attn_out_all/layer_15_width_262k_l0_big/params.safetensors b/attn_out_all/layer_15_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..48352568d131d7e9ff7d03ff1fff32d0bec89cc5 --- /dev/null +++ b/attn_out_all/layer_15_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be58a7e22b5872fcd59ab060dffc31fda392e8bc84c962772300245c8776f6fc +size 8592048520 diff --git a/attn_out_all/layer_16_width_262k_l0_small/params.safetensors b/attn_out_all/layer_16_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd9dd3bfbb0db8a86a08630761fed076f4737ef9 --- /dev/null +++ b/attn_out_all/layer_16_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df2a5dc1905ba9b7ec0a32d130110ebdf918fb99e73054c60e5ec4df2e673ec +size 8592048520 diff --git a/attn_out_all/layer_18_width_16k_l0_big/params.safetensors b/attn_out_all/layer_18_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..efd6e20393338d8ff5fd3ad588555524081efaea --- /dev/null +++ b/attn_out_all/layer_18_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b82df191e84f51f9a34912eca180a968e2f9f03fd21243c971d9acff8ca69b4 +size 537018752 diff --git a/attn_out_all/layer_19_width_16k_l0_small/params.safetensors b/attn_out_all/layer_19_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0e74d3baba739c265bd706f3a7a058a2e660ccdc --- /dev/null +++ b/attn_out_all/layer_19_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab1c9796bba8736de06caa37cbb369b1337ea66b4efea18a1f4252e57f416e8 +size 537018752 diff --git a/attn_out_all/layer_1_width_262k_l0_small/params.safetensors b/attn_out_all/layer_1_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ddee7c41869f9a7df8126382ce0aa2328ccc9088 --- /dev/null +++ b/attn_out_all/layer_1_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a34f0ee4d048c4fcd0596b8f9cb8e31b469c80c10ca1d1959120c0e1c9990bb +size 8592048520 diff --git a/attn_out_all/layer_20_width_16k_l0_small/params.safetensors b/attn_out_all/layer_20_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..738aa92e52216b6239d3a9bbdab0c0d482f0dcba --- /dev/null +++ b/attn_out_all/layer_20_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0057b78755714c475fe76ef2db3d6fc339c18a9979cc27fbfc1916ef24123367 +size 537018752 diff --git a/attn_out_all/layer_20_width_262k_l0_small/params.safetensors b/attn_out_all/layer_20_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..947b488ea20149a72030c1784aeb1c3ddf7e0ece --- /dev/null +++ b/attn_out_all/layer_20_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ad2d156b0b9c5d0a24174a2a2a7d74313222f8cad7f7489370425a887e441a +size 8592048520 diff --git a/attn_out_all/layer_21_width_16k_l0_small/params.safetensors b/attn_out_all/layer_21_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..26425841ce646c8dad547eb739b9b0fac27e1351 --- /dev/null +++ b/attn_out_all/layer_21_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73ad0cf131385ea23bf6c364d01038d49af36b20e37a864fdcd2e526762ca7d +size 537018752 diff --git a/attn_out_all/layer_21_width_262k_l0_big/params.safetensors b/attn_out_all/layer_21_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..27310e76349917d51d27f81380917458290512cf --- /dev/null +++ b/attn_out_all/layer_21_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb08d9aa661d05ead0a2f5afd9c8d98ba774060d91994712082ff6754a1353a9 +size 8592048520 diff --git a/attn_out_all/layer_22_width_16k_l0_small/params.safetensors b/attn_out_all/layer_22_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7de26603cd53389f746cfd61be34c42653de034b --- /dev/null +++ b/attn_out_all/layer_22_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6c53980a17c705262c4ba6583d3293925ee0637fc4b1e71c079fdd150be96a +size 537018752 diff --git a/attn_out_all/layer_23_width_262k_l0_small/params.safetensors b/attn_out_all/layer_23_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c5144dac3ca761a56d461d3d9a73f6d0056ef68c --- /dev/null +++ b/attn_out_all/layer_23_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f81f3617abf6078cff0fdd985ac0a472dfbc8612eba7a22ca980d0c2e3e11ec +size 8592048520 diff --git a/attn_out_all/layer_24_width_16k_l0_small/params.safetensors b/attn_out_all/layer_24_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e7c7ae43de79b0ad4355f91659c9c16ecea41f6e --- /dev/null +++ b/attn_out_all/layer_24_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e41cc790eff31800213245b08a0c16ae628ec7c9ca89cb808a8ab43d17a86b6 +size 537018752 diff --git a/attn_out_all/layer_24_width_262k_l0_big/params.safetensors b/attn_out_all/layer_24_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..86fb0535bd182bf168d93c234084d8d7eb02a41b --- /dev/null +++ b/attn_out_all/layer_24_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b9314f43f209a4d61780fa332bef32d8a4f1c0212d9352f8324e21d4e672c6 +size 8592048520 diff --git a/attn_out_all/layer_25_width_16k_l0_big/params.safetensors b/attn_out_all/layer_25_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9059e39a34643de8ae63ecb981b23c69e366ee9f --- /dev/null +++ b/attn_out_all/layer_25_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01464d96c80d2d8176d6156d5b885dfce71f2800aa980d87ece3d4c5783cc55e +size 537018752 diff --git a/attn_out_all/layer_25_width_16k_l0_small/params.safetensors b/attn_out_all/layer_25_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..003be52543f1508e9c371fdbcea45b1b5cb02bbd --- /dev/null +++ b/attn_out_all/layer_25_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c88d6170f502c4f00fc3831d2dc981ff65a31c4b3d3a6fd5d9955e34d10bbd +size 537018752 diff --git a/attn_out_all/layer_25_width_262k_l0_small/params.safetensors b/attn_out_all/layer_25_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3cb57e155b80e72f9efa525918182f232d5f3761 --- /dev/null +++ b/attn_out_all/layer_25_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:747a01693ab1c7a3eeb55733274fa0f6271f423eb6d6d7eb0a447716e029d7b7 +size 8592048520 diff --git a/attn_out_all/layer_26_width_16k_l0_small/params.safetensors b/attn_out_all/layer_26_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2d9852b1a3cf192fd449b5d2e5905918a2817e5 --- /dev/null +++ b/attn_out_all/layer_26_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33916168408e6923a94b4dfaa35f917012cd0c7f5093ce675ac9572f9ecc401f +size 537018752 diff --git a/attn_out_all/layer_26_width_262k_l0_big/params.safetensors b/attn_out_all/layer_26_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a9229e05b6fdeb49aa2d310e7bfd9e8e4bb69348 --- /dev/null +++ b/attn_out_all/layer_26_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06b169418ec04017d785ad900576e22017d8fa46a68e466d5322684d6d05970d +size 8592048520 diff --git a/attn_out_all/layer_27_width_16k_l0_big/params.safetensors b/attn_out_all/layer_27_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..16d8607ef19b8127e425a6661de98ac54d1b49f6 --- /dev/null +++ b/attn_out_all/layer_27_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59651e2dc9022d1d636a95b43b50faa183cca6adc324c26b1041f2b4109bee6a +size 537018752 diff --git a/attn_out_all/layer_27_width_16k_l0_small/params.safetensors b/attn_out_all/layer_27_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7cf40631c6135ef15bd04a9f5776de1dbb861340 --- /dev/null +++ b/attn_out_all/layer_27_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea4c2258e787abc44f66fdafb0a794a25b5fd122d4e1157007a7d7d52707b00a +size 537018752 diff --git a/attn_out_all/layer_27_width_262k_l0_big/params.safetensors b/attn_out_all/layer_27_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a40ed3c3b1d47b4497c39a0d9e3572228a6f622e --- /dev/null +++ b/attn_out_all/layer_27_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e607f10ca27a31cfccd46c3a2cc58ec4a2dcb38a6aad5c09c4934b61ede9c37 +size 8592048520 diff --git a/attn_out_all/layer_28_width_16k_l0_big/params.safetensors b/attn_out_all/layer_28_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60646f9b7182bbf1fb7a59810e8e025bad3c762d --- /dev/null +++ b/attn_out_all/layer_28_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:853b1fc7daa05f50400cb8a9374389373feecc8b7279a6246b435efcb4027855 +size 537018752 diff --git a/attn_out_all/layer_28_width_16k_l0_small/params.safetensors b/attn_out_all/layer_28_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4a7f74af76de730cb4af8fbd23b79455a2a007de --- /dev/null +++ b/attn_out_all/layer_28_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5113e7974d036c5369e540d4de38c07a77b6aed3cd070c8492374c2cbe3b0aab +size 537018752 diff --git a/attn_out_all/layer_29_width_16k_l0_big/params.safetensors b/attn_out_all/layer_29_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d9f97e01f7aecff6012ffae96f6ab48e9447bb3c --- /dev/null +++ b/attn_out_all/layer_29_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33198da10d15dd8f20b1b0fa2944c25648705b4612e83f5904f0619571b67b72 +size 537018752 diff --git a/attn_out_all/layer_29_width_16k_l0_small/params.safetensors b/attn_out_all/layer_29_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e90381659d61252f8998e0e7fe0cf7ab4a01019 --- /dev/null +++ b/attn_out_all/layer_29_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df9430d3798be83f6346a5f93f4787576b019d77dc1ace9729e7f37a414c6d60 +size 537018752 diff --git a/attn_out_all/layer_2_width_16k_l0_big/params.safetensors b/attn_out_all/layer_2_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3659eb6cb24c79dfd7f36d2e61879299a3f44aec --- /dev/null +++ b/attn_out_all/layer_2_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e2bd53f25bdadf185420933ca560b4500b92921af48640eb7b0d612c6e5477 +size 537018752 diff --git a/attn_out_all/layer_30_width_16k_l0_big/params.safetensors b/attn_out_all/layer_30_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..511c90221431a33a8c4fb81154d20617fe41b941 --- /dev/null +++ b/attn_out_all/layer_30_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:588b84b514f5400b07df2a620405cfecab8728a05092f742a6c653236926fcb4 +size 537018752 diff --git a/attn_out_all/layer_31_width_16k_l0_big/params.safetensors b/attn_out_all/layer_31_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..773f8deafe2b0ea9164c1920d0befea51fcf0f95 --- /dev/null +++ b/attn_out_all/layer_31_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d324e4bb72413a393ecbc26b1e50635e32177964c757c52b90d25c75d55efb8f +size 537018752 diff --git a/attn_out_all/layer_31_width_262k_l0_big/params.safetensors b/attn_out_all/layer_31_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2dbbaa0e79fec20d01bc1526a7ddeb0f7260e63a --- /dev/null +++ b/attn_out_all/layer_31_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9aefbb0aa813adcb92e69d4ee13399f8944e7944b0f837a2252fe209dac6b57 +size 8592048520 diff --git a/attn_out_all/layer_31_width_262k_l0_small/params.safetensors b/attn_out_all/layer_31_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07e0e73e1b89bc70c578102434dce92c2f31b0f6 --- /dev/null +++ b/attn_out_all/layer_31_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0b2fbd25c525e6c2c056ea4232a692f3d7c5d03b2e52dc038769f0e8b2b3e5e +size 8592048520 diff --git a/attn_out_all/layer_32_width_262k_l0_big/params.safetensors b/attn_out_all/layer_32_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb1e0f0025c4dbbf187715da7fbd79fa9e767d68 --- /dev/null +++ b/attn_out_all/layer_32_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7fc4f9675070eb6101153ae9b8b020e139afda67e9054bd3c51a239df349ca5 +size 8592048520 diff --git a/attn_out_all/layer_33_width_16k_l0_big/params.safetensors b/attn_out_all/layer_33_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..057138cd7e933359010643351e4549e59428e453 --- /dev/null +++ b/attn_out_all/layer_33_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7bc542e12bfe6902f4466bb7735f5413d31aaa7a849ccd7fb93dbe4df797dae +size 537018752 diff --git a/attn_out_all/layer_33_width_16k_l0_small/params.safetensors b/attn_out_all/layer_33_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c814537d98b4f265e80997fd53266b3dd5a7920c --- /dev/null +++ b/attn_out_all/layer_33_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcb45aa6f9fb1100ce9f87573208bff4e7c61a9c2d9040cd1b4692ec6fb619f0 +size 537018752 diff --git a/attn_out_all/layer_35_width_16k_l0_small/params.safetensors b/attn_out_all/layer_35_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..186be3a68def0601ad8191365f69248f7d1018d4 --- /dev/null +++ b/attn_out_all/layer_35_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ca55534e112d00f17c87f755666f77d75a5831e220baf94b6721eacb70ce53 +size 537018752 diff --git a/attn_out_all/layer_35_width_262k_l0_big/params.safetensors b/attn_out_all/layer_35_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9fdc1f7bdb8b8b4a23db249e4ebaba8f7b657656 --- /dev/null +++ b/attn_out_all/layer_35_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa7dfe5c982c20c2ff0ee9c90bc9df29fac32b38b11035cc0b21e19a83f56360 +size 8592048520 diff --git a/attn_out_all/layer_36_width_262k_l0_big/params.safetensors b/attn_out_all/layer_36_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0d2a71f7a91dddb918098298cc3ffb6bbc9df58b --- /dev/null +++ b/attn_out_all/layer_36_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00db99a169ecbade2d64692372df93fe30ef5456370e2619a96ebe53e0a2565d +size 8592048520 diff --git a/attn_out_all/layer_36_width_262k_l0_small/params.safetensors b/attn_out_all/layer_36_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92e52210a1b48d1d7692e5231ebf4dd3f2c08635 --- /dev/null +++ b/attn_out_all/layer_36_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0bb0390002c214c31b87674cad59d7f7e203b843fe716a91aa3b4be1d9b7fa9 +size 8592048520 diff --git a/attn_out_all/layer_37_width_16k_l0_big/params.safetensors b/attn_out_all/layer_37_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1aa4d19ddd985f81e05ed6d9205f2a462f812c2f --- /dev/null +++ b/attn_out_all/layer_37_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762d8a21e0ec91f26a2f9ec1913ac538731bd381dcd8ee57065f94e96d1b7568 +size 537018752 diff --git a/attn_out_all/layer_37_width_16k_l0_small/params.safetensors b/attn_out_all/layer_37_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0f4f715ca20f7fa3ec1e66f0bf16df15b745c1c --- /dev/null +++ b/attn_out_all/layer_37_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47d9c1b6ac6c843a0c03f058220e06678041b2e1e084523be30dfafb5e698f2e +size 537018752 diff --git a/attn_out_all/layer_37_width_262k_l0_big/params.safetensors b/attn_out_all/layer_37_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..befeb0ff4d3ae4274350f2a5c496aa672f32f795 --- /dev/null +++ b/attn_out_all/layer_37_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e8bf45ebfe432fca39d2ca56fa0848b7f345433c135fc8c484b5bf071c187e9 +size 8592048520 diff --git a/attn_out_all/layer_38_width_16k_l0_big/params.safetensors b/attn_out_all/layer_38_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d09e7bd7076b8ba6382302293c7b990c35d21ed --- /dev/null +++ b/attn_out_all/layer_38_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe47f965d016094fe6c8475a514955a95ef68bceb1ee6f0139c54c1beca79076 +size 537018752 diff --git a/attn_out_all/layer_38_width_16k_l0_small/params.safetensors b/attn_out_all/layer_38_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce8e9998d94c382099ce620f93e3bbb7445269cf --- /dev/null +++ b/attn_out_all/layer_38_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c55b852d4566c46faa7e6eefdc9b032479709ac15c027a4b4f6e422628a0449e +size 537018752 diff --git a/attn_out_all/layer_39_width_16k_l0_big/params.safetensors b/attn_out_all/layer_39_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6626cfc18eb4ede33cea49f5982eece8879d9f60 --- /dev/null +++ b/attn_out_all/layer_39_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4263c5f903ed6405fa71876e20b0c5aab07a92a5e8e3edc9084c0c39e8e09251 +size 537018752 diff --git a/attn_out_all/layer_39_width_16k_l0_small/params.safetensors b/attn_out_all/layer_39_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8dc0997273ebc48386ff2758adaee06d6587b2cf --- /dev/null +++ b/attn_out_all/layer_39_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd29f28cbeac72dad99e5acd0c683abe5b9083ecd02fed83c36f5e22d374158f +size 537018752 diff --git a/attn_out_all/layer_3_width_262k_l0_big/params.safetensors b/attn_out_all/layer_3_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..396446078d1a9d849b4c74e89be02878f052145f --- /dev/null +++ b/attn_out_all/layer_3_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bdde682a2f4d63148598eb138c9e5970bb7d9a8e9106b6863f846f4bf0b5d2d +size 8592048520 diff --git a/attn_out_all/layer_40_width_16k_l0_big/params.safetensors b/attn_out_all/layer_40_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fafd8a70397f5829b90b4b9b3a58f36d54c05490 --- /dev/null +++ b/attn_out_all/layer_40_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b845aed730c81921ed3da16170e3a0ddd4dd45efa5c93b0d0fa31352f38782d1 +size 537018752 diff --git a/attn_out_all/layer_40_width_16k_l0_small/params.safetensors b/attn_out_all/layer_40_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a82d02064e02570e9c79147dd0236c5f2957d9cc --- /dev/null +++ b/attn_out_all/layer_40_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd4c5ca5592f095d70db340e36604ba99f3d5e7cf6bfe4da8b425a15207747b +size 537018752 diff --git a/attn_out_all/layer_40_width_262k_l0_small/params.safetensors b/attn_out_all/layer_40_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..227df1b123c4c08249adff674bd5eabf60a5c68a --- /dev/null +++ b/attn_out_all/layer_40_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c32a5088c87982f32b483be709598119976b4cd8e060bd011118f9a1cc24fb70 +size 8592048520 diff --git a/attn_out_all/layer_41_width_16k_l0_big/params.safetensors b/attn_out_all/layer_41_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..47c8ee19fb836c52cf21825328d5fa6574ef5c60 --- /dev/null +++ b/attn_out_all/layer_41_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d56dec392e5dbb0e10b54622fea92819173c64987d1986795ba6f519d7cb76 +size 537018752 diff --git a/attn_out_all/layer_41_width_16k_l0_small/params.safetensors b/attn_out_all/layer_41_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb28b3529512a5c92b6f2f29b29e4c524537f188 --- /dev/null +++ b/attn_out_all/layer_41_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe7a3fc60463cc9466d06a3b4d513d29766cef6992ace5c6ab94e930a2fd7f8f +size 537018752 diff --git a/attn_out_all/layer_43_width_16k_l0_big/params.safetensors b/attn_out_all/layer_43_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ba71541d327055c767ea154a10f5a569562bf79 --- /dev/null +++ b/attn_out_all/layer_43_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27092dd065013bc7e685ec240a55e28ff3ac3ca9a6c7aa52b726df79316182f5 +size 537018752 diff --git a/attn_out_all/layer_43_width_16k_l0_small/params.safetensors b/attn_out_all/layer_43_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..35357c9e41827f6a8296da250c4aca0ce53f1a5d --- /dev/null +++ b/attn_out_all/layer_43_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dfd686011437a3d1c40c10b5cff691ec637a700f873566a163c1d7f687e92e7 +size 537018752 diff --git a/attn_out_all/layer_43_width_262k_l0_big/params.safetensors b/attn_out_all/layer_43_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..541e3f5c1dcdc9825034e2bac46325b425ed4e72 --- /dev/null +++ b/attn_out_all/layer_43_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee8d0c75c27d283f4cf53c828a8af57df6658cb4f6e07de0395f972c3907f37 +size 8592048520 diff --git a/attn_out_all/layer_44_width_16k_l0_big/params.safetensors b/attn_out_all/layer_44_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..318530bbda379e628b869234e5181ce5d32ccad1 --- /dev/null +++ b/attn_out_all/layer_44_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98f402979078ce3fa0f9eaf6bffebf16c8e4d3cabda866287131f8d6e0cff614 +size 537018752 diff --git a/attn_out_all/layer_45_width_16k_l0_big/params.safetensors b/attn_out_all/layer_45_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2893e180f1b3934ea70e38aef0e977fd819290ad --- /dev/null +++ b/attn_out_all/layer_45_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:836ef9434d5e58ccf947d9bd2dc94c815aac05ca1cb6471eb17922033b5cbd07 +size 537018752 diff --git a/attn_out_all/layer_45_width_262k_l0_big/params.safetensors b/attn_out_all/layer_45_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d105778802d1d038f7eb54b823bb9192fd4466f --- /dev/null +++ b/attn_out_all/layer_45_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c97493439d9d176d5fa56ae407e35f6a13c05394a4f7d71ed000fe0417da8c9b +size 8592048520 diff --git a/attn_out_all/layer_45_width_262k_l0_small/params.safetensors b/attn_out_all/layer_45_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94fa0de9e2c46b43c19615c290b2f4b969b7a791 --- /dev/null +++ b/attn_out_all/layer_45_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d4e027d091f4d23ec26885d3921bf37b3ba70cddcf329e2bb292a82de09b45 +size 8592048520 diff --git a/attn_out_all/layer_46_width_16k_l0_small/params.safetensors b/attn_out_all/layer_46_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..478dadfdfb6f96684ce3ea6f216c9c8d591c905b --- /dev/null +++ b/attn_out_all/layer_46_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855b9cc0208283abcd7b3b20c41c29b472a7b85c24c4187bc9dea8e9062756ea +size 537018752 diff --git a/attn_out_all/layer_47_width_16k_l0_big/params.safetensors b/attn_out_all/layer_47_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad0c828ac6adbabb148bbddd1eaaa2c32f598b64 --- /dev/null +++ b/attn_out_all/layer_47_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0614c46a34c21a599cf011b1a0785adf1ac505c04d427fb697970faa3bc41ac5 +size 537018752 diff --git a/attn_out_all/layer_47_width_262k_l0_small/params.safetensors b/attn_out_all/layer_47_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91187b9d49733127254e8068a5d8f764cee9b03b --- /dev/null +++ b/attn_out_all/layer_47_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0e90c49f0e366bee8b982f8c1102b6597e025f7458347dd02799d7a9062160f +size 8592048520 diff --git a/attn_out_all/layer_48_width_262k_l0_big/params.safetensors b/attn_out_all/layer_48_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ab03a523b4a392910be229beb5ca40751c3337b --- /dev/null +++ b/attn_out_all/layer_48_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c46fc466f8e30e74a9aa3cf384062adc6c0a7fb897f7c53c703feb5558acc3b +size 8592048520 diff --git a/attn_out_all/layer_49_width_262k_l0_big/params.safetensors b/attn_out_all/layer_49_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3c97c6d143db446e497e17939b9f198460932415 --- /dev/null +++ b/attn_out_all/layer_49_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e042e4b2b89f6e64a6fa2f0f9de34fcd83e94960061518e4a45eee9532a7aa4 +size 8592048520 diff --git a/attn_out_all/layer_4_width_16k_l0_big/params.safetensors b/attn_out_all/layer_4_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..480a06eb3566f6206f2c1e40df784f96f3b4d7fc --- /dev/null +++ b/attn_out_all/layer_4_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce84033b230b6cbf425e1a3fd7ce5acb779e7c0c42132701e9b1eaa705759998 +size 537018752 diff --git a/attn_out_all/layer_4_width_16k_l0_small/params.safetensors b/attn_out_all/layer_4_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3b2651c58054139b9c9f82c1544eed9336021cca --- /dev/null +++ b/attn_out_all/layer_4_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72cba2c13b31c8e75bf4ec271bb6d5449a0c339c5f94711d39ac0aad1a0fc1d9 +size 537018752 diff --git a/attn_out_all/layer_50_width_16k_l0_small/params.safetensors b/attn_out_all/layer_50_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f121600382583786a63686cef096738b4507606b --- /dev/null +++ b/attn_out_all/layer_50_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5dead284806d00bbe9b921fdb104d0a883be32541164415596d95dc4685badd +size 537018752 diff --git a/attn_out_all/layer_50_width_262k_l0_big/params.safetensors b/attn_out_all/layer_50_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4a5d6ba42eb54a455738b30a04f8c78433c36906 --- /dev/null +++ b/attn_out_all/layer_50_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a6f24ddfd8c9b27f53e0b74b6944fe4d647114e3024ec080ce88e589890b115 +size 8592048520 diff --git a/attn_out_all/layer_50_width_262k_l0_small/params.safetensors b/attn_out_all/layer_50_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..448bad4dfc29b54fb7af6adf37cc6dd902aa9595 --- /dev/null +++ b/attn_out_all/layer_50_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1889a908b8284afcadfdcd4c673714b9079c2c44252b04b2df411a0ce6d6c34f +size 8592048520 diff --git a/attn_out_all/layer_51_width_16k_l0_big/params.safetensors b/attn_out_all/layer_51_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3fa696eb3aa03e2c02479a08fe5ae19aec8d1e5 --- /dev/null +++ b/attn_out_all/layer_51_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f57ceceb2745f72af638a9b27ee076a355f2beed6e3967e3cd319e6d11913b +size 537018752 diff --git a/attn_out_all/layer_52_width_16k_l0_small/params.safetensors b/attn_out_all/layer_52_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..093ba0b77db36449e6a6d645f88dc1b5560213d5 --- /dev/null +++ b/attn_out_all/layer_52_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71edf782b28e7d6f6adc11f62c801d2e3ab13a787413f497da90ceb2c305f133 +size 537018752 diff --git a/attn_out_all/layer_52_width_262k_l0_small/params.safetensors b/attn_out_all/layer_52_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eb0ac8c31038c5f7150e489cd05c0c6abd0c1ef6 --- /dev/null +++ b/attn_out_all/layer_52_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36836ae4f17f28f1e6c4715215407561c9ce10c7f8ae0a09342928e2da18da5b +size 8592048520 diff --git a/attn_out_all/layer_53_width_16k_l0_big/params.safetensors b/attn_out_all/layer_53_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b14f088384877f48e1052d2788bd4ba6a40469c2 --- /dev/null +++ b/attn_out_all/layer_53_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09462823179927f7b9cfa53b9900318dafa86fd42edc1203a78f8e081bc3be82 +size 537018752 diff --git a/attn_out_all/layer_54_width_16k_l0_small/params.safetensors b/attn_out_all/layer_54_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b29e385a12291b23b5e03f47b396705d84eb4f28 --- /dev/null +++ b/attn_out_all/layer_54_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59c7f3822c1651d3e6dc0763ef5cbce7600abeb9b72e154986a387db94fc87b8 +size 537018752 diff --git a/attn_out_all/layer_54_width_262k_l0_small/params.safetensors b/attn_out_all/layer_54_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cef29eac9b298ba3dcc949e03147e0a0a09f9136 --- /dev/null +++ b/attn_out_all/layer_54_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6db81091ba617fa8b5a6977d4669ff94a5221d45ee43722ed74e7f633e90e376 +size 8592048520 diff --git a/attn_out_all/layer_55_width_16k_l0_big/params.safetensors b/attn_out_all/layer_55_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..501edc3dc61a16cbcb6fafb848a0eff43f1754fc --- /dev/null +++ b/attn_out_all/layer_55_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c5e8d4ad03275794e598a9b60ed66d120e6adccff3745b1ae9233f53569489b +size 537018752 diff --git a/attn_out_all/layer_55_width_16k_l0_small/params.safetensors b/attn_out_all/layer_55_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d5626410d6b99356c31566cdc210ee7f4540ef94 --- /dev/null +++ b/attn_out_all/layer_55_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb404fb85a5788fbfff2edcfc63b3a4170c498f48f4dc5f0279bb3a24d438229 +size 537018752 diff --git a/attn_out_all/layer_55_width_262k_l0_big/params.safetensors b/attn_out_all/layer_55_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f48149629ce7aa9f6cb31550aa7d10a3ccd3d548 --- /dev/null +++ b/attn_out_all/layer_55_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a50710a44b3b48674c056dcae00c17c7b4c1dd71c64fa2aaba4d8713f64b784 +size 8592048520 diff --git a/attn_out_all/layer_55_width_262k_l0_small/params.safetensors b/attn_out_all/layer_55_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c0661e1ecd28965ce39eb92032c403bf4d0b683 --- /dev/null +++ b/attn_out_all/layer_55_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b5d71e95b0cb39c21c91be2cdba4c0fb5983a4adb964e71d5111166a3df4f5 +size 8592048520 diff --git a/attn_out_all/layer_57_width_16k_l0_big/params.safetensors b/attn_out_all/layer_57_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..27cdef250e7efb32107be7ff4911aa454da6446c --- /dev/null +++ b/attn_out_all/layer_57_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:090dd181f8faa68916c28f17a4e7e9d55416045e8b0eec1d885925e2ec2d36b1 +size 537018752 diff --git a/attn_out_all/layer_57_width_16k_l0_small/params.safetensors b/attn_out_all/layer_57_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f14930827ebb2b3a78e358bbedf0974e27a6c6c --- /dev/null +++ b/attn_out_all/layer_57_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d118c1434db7d77ffc2a1537be6d1d7e1df573f6001221bcd14c9be333105bac +size 537018752 diff --git a/attn_out_all/layer_57_width_262k_l0_big/params.safetensors b/attn_out_all/layer_57_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6dd48625fdd1ba282094d2adad0383b853581381 --- /dev/null +++ b/attn_out_all/layer_57_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5916c8484274f9e6a6e61a2b1afa87ccad22da754cedfc582bfd4a0f712fd34d +size 8592048520 diff --git a/attn_out_all/layer_58_width_16k_l0_big/params.safetensors b/attn_out_all/layer_58_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3c9ab0c3acb3004dd57eb03e36a46ddaf37f38c --- /dev/null +++ b/attn_out_all/layer_58_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c2f5f8d1b64d1d2e90eb2daf2082957250f71d4326c8d8021e92b3e95281926 +size 537018752 diff --git a/attn_out_all/layer_58_width_16k_l0_small/params.safetensors b/attn_out_all/layer_58_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..28645fbef3bd7555573d86ecf68fc349ea06d8a5 --- /dev/null +++ b/attn_out_all/layer_58_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cde63ce6068a4744d4c1d8ff0148f570f68bee9242dba25e73ba118008193d54 +size 537018752 diff --git a/attn_out_all/layer_58_width_262k_l0_big/params.safetensors b/attn_out_all/layer_58_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..447665ec60f6249dce51d8631975482c542deb7d --- /dev/null +++ b/attn_out_all/layer_58_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca35f355625a328da9c4dd84adbfc18291c325b25f4c4b263eb012531b4fa64 +size 8592048520 diff --git a/attn_out_all/layer_59_width_16k_l0_small/params.safetensors b/attn_out_all/layer_59_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f925c5aff02c14c3288cc858ae45caef8df3b69 --- /dev/null +++ b/attn_out_all/layer_59_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1af181de5bb20b5be719b1e8b3c561ae8167b290820584dbcf6af9b662d151ce +size 537018752 diff --git a/attn_out_all/layer_59_width_262k_l0_small/params.safetensors b/attn_out_all/layer_59_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..24465a4e2ddab89907e177aa35276bd35b703c76 --- /dev/null +++ b/attn_out_all/layer_59_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2f32412b01e128b7b1b5279790f2e433bfa72a9f9982b1457d5afc3e9c38de9 +size 8592048520 diff --git a/attn_out_all/layer_5_width_16k_l0_big/params.safetensors b/attn_out_all/layer_5_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e09752f13237d8c4eae9f10d72de421af0e8a36 --- /dev/null +++ b/attn_out_all/layer_5_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b18068d0e4211678607470722a5c6ae259c7da189cb70ba9eb3b3abd98dc78 +size 537018752 diff --git a/attn_out_all/layer_5_width_262k_l0_big/params.safetensors b/attn_out_all/layer_5_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b508d485129d83cad7b890bcc269fc81b1840fc --- /dev/null +++ b/attn_out_all/layer_5_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b6b0a4f99f41e3ce1dfa021045dba55752c2dc50a6181c683b715fd58f031f +size 8592048520 diff --git a/attn_out_all/layer_60_width_16k_l0_big/params.safetensors b/attn_out_all/layer_60_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0964c2e6aa898ea675d6148cd69e4b11ca9b6648 --- /dev/null +++ b/attn_out_all/layer_60_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e056df59d8c8caba7ca3fc11c54378af61f27b308fb02ee9a15016d83f0829 +size 537018752 diff --git a/attn_out_all/layer_60_width_16k_l0_small/params.safetensors b/attn_out_all/layer_60_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..818889ba6c94a9b3037769cd973fa821741c40b8 --- /dev/null +++ b/attn_out_all/layer_60_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f57e907ac9cd973d18da5dbd4296294e6cd306374c024e4a157631de6b3a05f6 +size 537018752 diff --git a/attn_out_all/layer_60_width_262k_l0_big/params.safetensors b/attn_out_all/layer_60_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e95d40907d42cb32e0bdfcc74c4db60a3fbf2ed0 --- /dev/null +++ b/attn_out_all/layer_60_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1d23e2f1b42fffdf63298c9b1d98f5c9b759f4737ca2252f5b167d21ce5c43 +size 8592048520 diff --git a/attn_out_all/layer_61_width_16k_l0_big/params.safetensors b/attn_out_all/layer_61_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06e8a28ff507c53e527d15e211eeb857a6f92507 --- /dev/null +++ b/attn_out_all/layer_61_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:883738c85bb664458a8e7cd92c81b7f571789c5eb7ed8ec342404404c45dedf9 +size 537018752 diff --git a/attn_out_all/layer_61_width_262k_l0_small/params.safetensors b/attn_out_all/layer_61_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ac3e26acc31b05e95f23de58a24e0a71f9df508 --- /dev/null +++ b/attn_out_all/layer_61_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b5bfd7d668e8f3f023451ddbbc5d5e4917ab5aa887dd3b71cfb36e0a882a5f8 +size 8592048520 diff --git a/attn_out_all/layer_6_width_16k_l0_small/params.safetensors b/attn_out_all/layer_6_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7fc4dbc829e218c883ef2d66bfa223e6cb864979 --- /dev/null +++ b/attn_out_all/layer_6_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4076144d43071485391004243b3873c29c1998eb9d49742bfefcf7c54c38d052 +size 537018752 diff --git a/attn_out_all/layer_7_width_16k_l0_big/params.safetensors b/attn_out_all/layer_7_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ef8f3e72e28a823912681c90fc53cfef06ab5d4 --- /dev/null +++ b/attn_out_all/layer_7_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ceea9ade5186505d3f6033a1ee97b46e9bfba8d165a6319e9a5d4cf283490db +size 537018752 diff --git a/attn_out_all/layer_7_width_16k_l0_small/params.safetensors b/attn_out_all/layer_7_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a89d1db91a79bd8058304d0e6dff2e18ed6cbb66 --- /dev/null +++ b/attn_out_all/layer_7_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa136cfdbfc1b85041d58f4a5326caaa939a961e59263dc8a886f70fe9e0aac +size 537018752 diff --git a/attn_out_all/layer_8_width_16k_l0_small/params.safetensors b/attn_out_all/layer_8_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5fe564bd5d0a4b6f667cf24e0d572b1c529cf27a --- /dev/null +++ b/attn_out_all/layer_8_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80a08e31bbbb1cd77df6380fff4d5dabd280d7cdd7b431e938be309a24ceefd +size 537018752 diff --git a/attn_out_all/layer_8_width_262k_l0_big/params.safetensors b/attn_out_all/layer_8_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d146967350c1e0bda5a67d990deb61324910babc --- /dev/null +++ b/attn_out_all/layer_8_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b6d5a4936fd54544816daf9282ce00f045164dfbe3579192a384183b4a52de +size 8592048520 diff --git a/attn_out_all/layer_8_width_262k_l0_small/params.safetensors b/attn_out_all/layer_8_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b7befd3b0ba839b190c4df5720cc489cb6275903 --- /dev/null +++ b/attn_out_all/layer_8_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8120280e0fac75b3bcd4402cd8f90fb0e1a04e0a4923ccc2baba551581d38bd9 +size 8592048520 diff --git a/attn_out_all/layer_9_width_16k_l0_big/params.safetensors b/attn_out_all/layer_9_width_16k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0419c73b3c114e8e343920be053c9435db1d09a --- /dev/null +++ b/attn_out_all/layer_9_width_16k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3211e473239035a255aa49343743e99710e1fb2f198c9c0e73a527f9d5b64dc2 +size 537018752 diff --git a/attn_out_all/layer_9_width_16k_l0_small/params.safetensors b/attn_out_all/layer_9_width_16k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69514ae0ddbf5611c754e2df3a2d2289edb992a0 --- /dev/null +++ b/attn_out_all/layer_9_width_16k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f22833a941643e846c3d3ca969e994509ee1c405d5c3982288ab096deb017074 +size 537018752 diff --git a/attn_out_all/layer_9_width_262k_l0_big/params.safetensors b/attn_out_all/layer_9_width_262k_l0_big/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..707ee57b56f20bb396f1bcd15558079534b805e9 --- /dev/null +++ b/attn_out_all/layer_9_width_262k_l0_big/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e8bbbba247871da34f66330ebe32a2c1297b0aca30d2d51a1d6f067aea5ec4 +size 8592048520 diff --git a/attn_out_all/layer_9_width_262k_l0_small/params.safetensors b/attn_out_all/layer_9_width_262k_l0_small/params.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..709e3db181c60ef2725196d571d8d3d42b7d7d7a --- /dev/null +++ b/attn_out_all/layer_9_width_262k_l0_small/params.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:324717b3b44076a2dc0a1e4801422afcb08bc82c9f1e3e9e8a1de905443458dd +size 8592048520 diff --git a/mlp_out_all/layer_17_width_16k_l0_big/config.json b/mlp_out_all/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..382b6907736c7c6a0b6d726dbd6f7d6c59f5c6d1 --- /dev/null +++ b/mlp_out_all/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 109, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_262k_l0_big/config.json b/mlp_out_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1bf3859f6629ede614661cf78f5c47597219a385 --- /dev/null +++ b/mlp_out_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_32_width_16k_l0_big/config.json b/mlp_out_all/layer_32_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0a00fbe7f146b6c3793b969ad2b5dc6358b9d23 --- /dev/null +++ b/mlp_out_all/layer_32_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.32.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_33_width_262k_l0_big/config.json b/mlp_out_all/layer_33_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f0841eb58c8f23d46047cfdcca1a5f4daa6a480d --- /dev/null +++ b/mlp_out_all/layer_33_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_33_width_262k_l0_small/config.json b/mlp_out_all/layer_33_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df9c1c19bca17b6807aa4eb81d316da71c5f5478 --- /dev/null +++ b/mlp_out_all/layer_33_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_51_width_262k_l0_small/config.json b/mlp_out_all/layer_51_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..084c647ca8aaa67a97c6b5d4ee3c20cddcb57bbf --- /dev/null +++ b/mlp_out_all/layer_51_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.51.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.51.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_52_width_16k_l0_big/config.json b/mlp_out_all/layer_52_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..65dab70e38a387c41a66e3c09a9730a7142c52dd --- /dev/null +++ b/mlp_out_all/layer_52_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.52.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_56_width_16k_l0_big/config.json b/mlp_out_all/layer_56_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c4bbfc9e40c5295833270391ba4bb118dedbcbc3 --- /dev/null +++ b/mlp_out_all/layer_56_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.56.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_61_width_16k_l0_small/config.json b/mlp_out_all/layer_61_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..74be07f793a894fe4c9c26cefbede3a88ac3eaab --- /dev/null +++ b/mlp_out_all/layer_61_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.61.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_262k_l0_big/config.json b/mlp_out_all/layer_6_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7beafeaffe3650727e2543b06c08077f54ffd03c --- /dev/null +++ b/mlp_out_all/layer_6_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 77, + "affine_connection": false +} \ No newline at end of file