diff --git a/resid_post/layer_17_width_16k_l0_medium/config.json b/resid_post/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d88acc16ddfa9de21465c35fa1c2f2cee405c29 --- /dev/null +++ b/resid_post/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_17_width_16k_l0_small/config.json b/resid_post/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..27cb1162cdc08d23f603748a40fd671fdb7d245a --- /dev/null +++ b/resid_post/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_17_width_1m_l0_small/config.json b/resid_post/layer_17_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..26d2854976cdd300da6dc718f01e5f9ed1e3fa7e --- /dev/null +++ b/resid_post/layer_17_width_1m_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 1048576, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_big/config.json b/resid_post/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5a29d5db9ea186af0ac4caaef2427b56dde40be5 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_medium/config.json b/resid_post/layer_17_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba7880855a5b4ace1c0df2f1bc04c50d291fd72 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_17_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba7880855a5b4ace1c0df2f1bc04c50d291fd72 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_small/config.json b/resid_post/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..63c74698f908817a051d0aa221cbdc28b9eaa323 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_17_width_65k_l0_medium/config.json b/resid_post/layer_17_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..863cec1344946051eed215df05e011e22cd310ac --- /dev/null +++ b/resid_post/layer_17_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_16k_l0_big/config.json b/resid_post/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cc357d848822bdfa99898dad7606dde2cd78ac44 --- /dev/null +++ b/resid_post/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_16k_l0_medium/config.json b/resid_post/layer_22_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..31169bb2a061d3d055cb0a97a03664fbc272ddf7 --- /dev/null +++ b/resid_post/layer_22_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_1m_l0_big/config.json b/resid_post/layer_22_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..842d2a2adb460e02ee7c9a01156cbc7aa0688b04 --- /dev/null +++ b/resid_post/layer_22_width_1m_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 1048576, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_1m_l0_small/config.json b/resid_post/layer_22_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2a393a84995d0d199d2a05c40a062aa6b0eb6d7a --- /dev/null +++ b/resid_post/layer_22_width_1m_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 1048576, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_262k_l0_medium/config.json b/resid_post/layer_22_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4eb8289c36e3ef802001d473dc953f06af2fc476 --- /dev/null +++ b/resid_post/layer_22_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_22_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4eb8289c36e3ef802001d473dc953f06af2fc476 --- /dev/null +++ b/resid_post/layer_22_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_262k_l0_small/config.json b/resid_post/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8cd581ab41e9edb42bca2cb89ebaca304c5a4032 --- /dev/null +++ b/resid_post/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_65k_l0_big/config.json b/resid_post/layer_22_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0b43f17be273dfb59ec6605252a2c61ff65b5672 --- /dev/null +++ b/resid_post/layer_22_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_65k_l0_medium/config.json b/resid_post/layer_22_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f1fc2dc31ac7cce2a857682d81cf55a61c6e2cf1 --- /dev/null +++ b/resid_post/layer_22_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_22_width_65k_l0_small/config.json b/resid_post/layer_22_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7dbc061b9d66e1dc438b147c8126ccd97608e728 --- /dev/null +++ b/resid_post/layer_22_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_16k_l0_big/config.json b/resid_post/layer_29_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..34108214a7321c6fd2abf82847a2fa6941545894 --- /dev/null +++ b/resid_post/layer_29_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_16k_l0_medium/config.json b/resid_post/layer_29_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9cab3e7e00ec7d4dd6faaff038b1640292888718 --- /dev/null +++ b/resid_post/layer_29_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_16k_l0_small/config.json b/resid_post/layer_29_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e77c58a885087f4b5a5c0c31cfc1e027b38d2375 --- /dev/null +++ b/resid_post/layer_29_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_1m_l0_big/config.json b/resid_post/layer_29_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..775c40590bcb6b32dc7cd08734d65b62026ab783 --- /dev/null +++ b/resid_post/layer_29_width_1m_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 1048576, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_1m_l0_medium/config.json b/resid_post/layer_29_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c1add0f9972a7f126e5288255504b5e8a77b123 --- /dev/null +++ b/resid_post/layer_29_width_1m_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 1048576, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_1m_l0_small/config.json b/resid_post/layer_29_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c100c224bb0d3948a83a313732cfeb5886560236 --- /dev/null +++ b/resid_post/layer_29_width_1m_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 1048576, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_262k_l0_medium/config.json b/resid_post/layer_29_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..15257b42a7e37133943fa2e4a176982807490c0a --- /dev/null +++ b/resid_post/layer_29_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_29_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..15257b42a7e37133943fa2e4a176982807490c0a --- /dev/null +++ b/resid_post/layer_29_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_65k_l0_big/config.json b/resid_post/layer_29_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..217e98f28b533adf51f55712e8e27ca123b7eb0d --- /dev/null +++ b/resid_post/layer_29_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_65k_l0_medium/config.json b/resid_post/layer_29_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..44e74428edf865cc6ea411fc2ae9b2d8c6f8e5ab --- /dev/null +++ b/resid_post/layer_29_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_65k_l0_small/config.json b/resid_post/layer_29_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aebfdf3ee77262a414c09af772ab8c95ec30849f --- /dev/null +++ b/resid_post/layer_29_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_16k_l0_big/config.json b/resid_post/layer_9_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e54a89ac3bc5bf96ee94ba100ec0901a207491b6 --- /dev/null +++ b/resid_post/layer_9_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 131, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_16k_l0_medium/config.json b/resid_post/layer_9_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c2dd6c04621c8f1c4f220163cb52bb2db26c0da6 --- /dev/null +++ b/resid_post/layer_9_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_big/config.json b/resid_post/layer_9_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8f1b82235b55ae55bb616cac65c0e782b8fe2b72 --- /dev/null +++ b/resid_post/layer_9_width_1m_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 1048576, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 131, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_big/config.json b/resid_post/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dcd83bf3bec64718d8454001456da04e5fc1b36e --- /dev/null +++ b/resid_post/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 131, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_small/config.json b/resid_post/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2b636e97b43673bf91d6100af82d55498aeabb0 --- /dev/null +++ b/resid_post/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_big/config.json b/resid_post/layer_9_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9a6d139c62769c3b2e5333bdedc112f3ca4ab515 --- /dev/null +++ b/resid_post/layer_9_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 131, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_medium/config.json b/resid_post/layer_9_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bfa9650688393556bafa575fdb8203ba58c62eda --- /dev/null +++ b/resid_post/layer_9_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_262k_l0_small/config.json b/resid_post_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53e30ef030d06229075656e57c552a710dcafda3 --- /dev/null +++ b/resid_post_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_16k_l0_small/config.json b/resid_post_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..118fff1faf943f01143404addb3b6d63df10fe38 --- /dev/null +++ b/resid_post_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_262k_l0_small/config.json b/resid_post_all/layer_10_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..801a3b65f1abb118f4fdd715d0ff4e74e359f547 --- /dev/null +++ b/resid_post_all/layer_10_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_16k_l0_big/config.json b/resid_post_all/layer_11_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4f4bdab0d3c59f5c35b4f4b59e3960a3bbe49f4d --- /dev/null +++ b/resid_post_all/layer_11_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 118, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_16k_l0_small/config.json b/resid_post_all/layer_11_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c730179d62117c5c8a91d89fa6c214d008c4ac0 --- /dev/null +++ b/resid_post_all/layer_11_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_16k_l0_small/config.json b/resid_post_all/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0fd2823cac298d5934ac42f753c9c71999ebc55 --- /dev/null +++ b/resid_post_all/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_16k_l0_small/config.json b/resid_post_all/layer_14_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7ca06def86b3491c5cf59fc00c795fb42ac23993 --- /dev/null +++ b/resid_post_all/layer_14_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_16k_l0_big/config.json b/resid_post_all/layer_16_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bc396535e17d2c872a2a8b759169ea1cc78a2251 --- /dev/null +++ b/resid_post_all/layer_16_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_262k_l0_big/config.json b/resid_post_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8385059ce265d5ace68e81ad98ea616ee1725a08 --- /dev/null +++ b/resid_post_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_262k_l0_small/config.json b/resid_post_all/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..63c74698f908817a051d0aa221cbdc28b9eaa323 --- /dev/null +++ b/resid_post_all/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_16k_l0_big/config.json b/resid_post_all/layer_18_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..215b689cb7313e903bd84cc9e0b2b2cb37806396 --- /dev/null +++ b/resid_post_all/layer_18_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_16k_l0_small/config.json b/resid_post_all/layer_19_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..71684cfd6ecad212b36b55b70f3769d8a4dd9a64 --- /dev/null +++ b/resid_post_all/layer_19_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_262k_l0_big/config.json b/resid_post_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8d4b970231df62c6011bcc986f68b6977af4a1da --- /dev/null +++ b/resid_post_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_262k_l0_small/config.json b/resid_post_all/layer_19_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..902f0aca713ae5169752d2403000ec743490c268 --- /dev/null +++ b/resid_post_all/layer_19_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_262k_l0_small/config.json b/resid_post_all/layer_1_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3e6913095100bbe0f098f5e7cfd9bd66af2c4fe6 --- /dev/null +++ b/resid_post_all/layer_1_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_262k_l0_small/config.json b/resid_post_all/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8cd581ab41e9edb42bca2cb89ebaca304c5a4032 --- /dev/null +++ b/resid_post_all/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_16k_l0_small/config.json b/resid_post_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..65b1050b940a3b172d13919d832316e84d5d1097 --- /dev/null +++ b/resid_post_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_16k_l0_big/config.json b/resid_post_all/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a2ed6cb4bbe70d8773a6e383bf01a6fb5b4f6bd9 --- /dev/null +++ b/resid_post_all/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_16k_l0_small/config.json b/resid_post_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2d24ae2e804b4c5b4aee1606a1fc820f31c226ec --- /dev/null +++ b/resid_post_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_26_width_16k_l0_big/config.json b/resid_post_all/layer_26_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..44389f574c4a6ce1684df34194fa31ae0fba1be2 --- /dev/null +++ b/resid_post_all/layer_26_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.output", + "hf_hook_point_out": "model.layers.26.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_26_width_16k_l0_small/config.json b/resid_post_all/layer_26_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..54c9510caf2497e9b610d1d7d9de46b9ae15ac14 --- /dev/null +++ b/resid_post_all/layer_26_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.output", + "hf_hook_point_out": "model.layers.26.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_26_width_262k_l0_big/config.json b/resid_post_all/layer_26_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..737e96bba494808c50c6d44669e327225857079b --- /dev/null +++ b/resid_post_all/layer_26_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.output", + "hf_hook_point_out": "model.layers.26.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_27_width_262k_l0_big/config.json b/resid_post_all/layer_27_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..050d66b9c9471686d3fdef412e14b30ff76ad610 --- /dev/null +++ b/resid_post_all/layer_27_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.output", + "hf_hook_point_out": "model.layers.27.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_28_width_16k_l0_small/config.json b/resid_post_all/layer_28_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef335a7b6df96dfdd825a72a17f4942356310be6 --- /dev/null +++ b/resid_post_all/layer_28_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.output", + "hf_hook_point_out": "model.layers.28.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_30_width_262k_l0_big/config.json b/resid_post_all/layer_30_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a7434f4aec9d2baf22f872910990a534e2f639c2 --- /dev/null +++ b/resid_post_all/layer_30_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.30.output", + "hf_hook_point_out": "model.layers.30.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_30_width_262k_l0_small/config.json b/resid_post_all/layer_30_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..34550f3955b7c06c38ba96e25229abb9de6fa2f2 --- /dev/null +++ b/resid_post_all/layer_30_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.30.output", + "hf_hook_point_out": "model.layers.30.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_31_width_16k_l0_big/config.json b/resid_post_all/layer_31_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dc02617b45bd6ae54dd2e245a90d4b09a55758c9 --- /dev/null +++ b/resid_post_all/layer_31_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_31_width_262k_l0_small/config.json b/resid_post_all/layer_31_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..02fc60ee9d5a4b351c9616cd773fc4ee29e4286e --- /dev/null +++ b/resid_post_all/layer_31_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_32_width_262k_l0_big/config.json b/resid_post_all/layer_32_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..361dfd9041746b2d715a26107f6e5c41640996e0 --- /dev/null +++ b/resid_post_all/layer_32_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.32.output", + "hf_hook_point_out": "model.layers.32.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_32_width_262k_l0_small/config.json b/resid_post_all/layer_32_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef94930610d24e97d98d0c5cc90ff6eba8b46578 --- /dev/null +++ b/resid_post_all/layer_32_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.32.output", + "hf_hook_point_out": "model.layers.32.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_16k_l0_big/config.json b/resid_post_all/layer_3_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e762170f7f5de37042feafaaa60bf27d0fdc4d20 --- /dev/null +++ b/resid_post_all/layer_3_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 75, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_262k_l0_big/config.json b/resid_post_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e624587bf8213eaee14c36aebb53b956f88a96e4 --- /dev/null +++ b/resid_post_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 75, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_16k_l0_big/config.json b/resid_post_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5043764d2a31d16ea191cc3555f76aa242a03d8 --- /dev/null +++ b/resid_post_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 81, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_262k_l0_big/config.json b/resid_post_all/layer_4_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e97bf5bae6251cae491f4e71c7f1dcbd55c5805c --- /dev/null +++ b/resid_post_all/layer_4_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 81, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_16k_l0_big/config.json b/resid_post_all/layer_8_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e8daafef519eb1b7f6dfe7fb9ff5ec6a90ab54d5 --- /dev/null +++ b/resid_post_all/layer_8_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 102, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_16k_l0_small/config.json b/resid_post_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f63c20aec681f7e9939f67bf65d89b4346f43b37 --- /dev/null +++ b/resid_post_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_262k_l0_big/config.json b/resid_post_all/layer_8_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..19f9e560283ce75268b36a04aa272417e6693157 --- /dev/null +++ b/resid_post_all/layer_8_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 102, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_262k_l0_small/config.json b/resid_post_all/layer_8_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..127d11a42ca3fad2820212e7dd94ff40046e42a3 --- /dev/null +++ b/resid_post_all/layer_8_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_262k_l0_big/config.json b/resid_post_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f7a04e45cdde525411a1b0ea83f9fc067148385b --- /dev/null +++ b/resid_post_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 107, + "affine_connection": false +} \ No newline at end of file