diff --git a/mlp_out/layer_13_width_16k_l0_big/config.json b/mlp_out/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..06f440f768fce7c64ddb9dafd50689bd0938c337 --- /dev/null +++ b/mlp_out/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_16k_l0_medium/config.json b/mlp_out/layer_13_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c1878eeb5a3ecdc3d2556641a13df564981edba8 --- /dev/null +++ b/mlp_out/layer_13_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_16k_l0_small/config.json b/mlp_out/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6f2b7f13ac0ffea0c818be45b524c49da5f946bc --- /dev/null +++ b/mlp_out/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_1m_l0_big/config.json b/mlp_out/layer_13_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..67026e3afbe03407061251814e22f3d879722311 --- /dev/null +++ b/mlp_out/layer_13_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_1m_l0_medium/config.json b/mlp_out/layer_13_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..93d4d08c5fb595c0f6ef3868a0795f8ebec55473 --- /dev/null +++ b/mlp_out/layer_13_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_1m_l0_small/config.json b/mlp_out/layer_13_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..11805be270b8b340fc3ca549dee54163a2b41c12 --- /dev/null +++ b/mlp_out/layer_13_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_262k_l0_big/config.json b/mlp_out/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dd275352c68a21fbeb59a296094d91d08266d094 --- /dev/null +++ b/mlp_out/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_262k_l0_medium/config.json b/mlp_out/layer_13_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5f45bc5d01bd4ec0f771691e0585a154151df5f0 --- /dev/null +++ b/mlp_out/layer_13_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_262k_l0_small/config.json b/mlp_out/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..00c0d432ab056e1e45c1e50d07bb67f8363d84f4 --- /dev/null +++ b/mlp_out/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_65k_l0_big/config.json b/mlp_out/layer_13_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9820d727e9e5100a48dfb469c58fa65ec6c4772b --- /dev/null +++ b/mlp_out/layer_13_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_65k_l0_medium/config.json b/mlp_out/layer_13_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..442244f82fd1fb4860d8a1e3e6d177fce13ddc04 --- /dev/null +++ b/mlp_out/layer_13_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_16k_l0_medium/config.json b/mlp_out/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f001e2d3d8e02e059d8761e41e10f05a95094138 --- /dev/null +++ b/mlp_out/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_16k_l0_small/config.json b/mlp_out/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f6e624b7429f7dff109cc7f3fb2caaab3c2d39b4 --- /dev/null +++ b/mlp_out/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_1m_l0_big/config.json b/mlp_out/layer_17_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..79bbdfd33625cb7217a0b11ea7c753e11974550f --- /dev/null +++ b/mlp_out/layer_17_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_1m_l0_medium/config.json b/mlp_out/layer_17_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fd9055015b0ccdc91ff6d958a3cbf0ef761e7da5 --- /dev/null +++ b/mlp_out/layer_17_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_1m_l0_small/config.json b/mlp_out/layer_17_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3e9ea9db3aad76a887365ec8b5ce2c124da0ddce --- /dev/null +++ b/mlp_out/layer_17_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_big/config.json b/mlp_out/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dbaf318695181c9ee213fec8636dda8e17cd7c64 --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_medium/config.json b/mlp_out/layer_17_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d2bc6308580c9b573d5a719d4a09fc6c00cbb2b --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_small/config.json b/mlp_out/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0875bab86c3451f481168c8bfdfd26a0a392d567 --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_big/config.json b/mlp_out/layer_17_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..34c3c4d4676aeea5c9d4397d95ee21aadade1339 --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_medium/config.json b/mlp_out/layer_17_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..03ffb48a926362b715dce96eb44e46715e04a1f8 --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_small/config.json b/mlp_out/layer_17_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1b44bce328568869b6a4b3f95e9c1ad7a5a404f1 --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_16k_l0_big/config.json b/mlp_out/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..42d1668c6287a27ca24b75e7a365e1cf9f87dc3f --- /dev/null +++ b/mlp_out/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_16k_l0_small/config.json b/mlp_out/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..99bb55c527d77c0696472e6952a3d4594ecdff43 --- /dev/null +++ b/mlp_out/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_1m_l0_big/config.json b/mlp_out/layer_22_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..26ee80fc30d6a5d8958d43b92f2f78745d92223e --- /dev/null +++ b/mlp_out/layer_22_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_1m_l0_medium/config.json b/mlp_out/layer_22_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..55ab66c28c36d7bed09f253a62c86a7b05e73cda --- /dev/null +++ b/mlp_out/layer_22_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_1m_l0_small/config.json b/mlp_out/layer_22_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32e41832356dd72c96162f963a7cf94932babfd6 --- /dev/null +++ b/mlp_out/layer_22_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_big/config.json b/mlp_out/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a444aa23f15159dfc046bfd256d4f37c1899312 --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_medium/config.json b/mlp_out/layer_22_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..719c02767812c3130ffecf5203df12c0408412e3 --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_small/config.json b/mlp_out/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c63a3af64b2e6f4c06c85d5558ac8d7faf9aa8f8 --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_big/config.json b/mlp_out/layer_22_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ece94fa4d5a8f58894f4070f2c99ef507c852a8 --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_medium/config.json b/mlp_out/layer_22_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3833b9f29cfecd77ae25cf67b6b14c7765293333 --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_small/config.json b/mlp_out/layer_22_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a944edb6cef46082e40c56fe69b8671edcac77d6 --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_16k_l0_big/config.json b/mlp_out/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2eee1cf63579cc367413438a643d417c932afb8e --- /dev/null +++ b/mlp_out/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_16k_l0_medium/config.json b/mlp_out/layer_7_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0667118db4d63925910b97aabf899ff1f92b398b --- /dev/null +++ b/mlp_out/layer_7_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_16k_l0_small/config.json b/mlp_out/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..518b67570495b7ba1eafba526546bbd6c96ab06b --- /dev/null +++ b/mlp_out/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_1m_l0_big/config.json b/mlp_out/layer_7_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7c68f7bb32b7389da96aa59001843b3286213df5 --- /dev/null +++ b/mlp_out/layer_7_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_1m_l0_medium/config.json b/mlp_out/layer_7_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a343ed761c35368dd81d92ea94193a0490d8427e --- /dev/null +++ b/mlp_out/layer_7_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_1m_l0_small/config.json b/mlp_out/layer_7_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f89857d7f461a18536b9f7e72e6c1e86db4f0b8a --- /dev/null +++ b/mlp_out/layer_7_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_262k_l0_big/config.json b/mlp_out/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b143c4bae3371dde0bea53632d8bccba5eb0e46e --- /dev/null +++ b/mlp_out/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_262k_l0_medium/config.json b/mlp_out/layer_7_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5237810270f93bd8b25d143cb348f9119df216fd --- /dev/null +++ b/mlp_out/layer_7_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_262k_l0_small/config.json b/mlp_out/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..91db45f316674abc99943ed3a0d52384d9c4a5fb --- /dev/null +++ b/mlp_out/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_65k_l0_big/config.json b/mlp_out/layer_7_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..830f4bb2892a1a4a0dfdee402f5a7a52a050ece0 --- /dev/null +++ b/mlp_out/layer_7_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_65k_l0_medium/config.json b/mlp_out/layer_7_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6de78a90fd47a6b62909a5eeddbb7864e921cbb5 --- /dev/null +++ b/mlp_out/layer_7_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_65k_l0_small/config.json b/mlp_out/layer_7_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..02f0ef74324e3c106a7f61ea73463b480f670179 --- /dev/null +++ b/mlp_out/layer_7_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_262k_l0_small/config.json b/mlp_out_all/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7e26c8e4984761b2c70e43c0fd3acd32caa58fd8 --- /dev/null +++ b/mlp_out_all/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_262k_l0_big/config.json b/mlp_out_all/layer_14_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1d75711f850793425112c1b78387c11a61df4ce3 --- /dev/null +++ b/mlp_out_all/layer_14_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_16k_l0_small/config.json b/mlp_out_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..82b45fc29f0bd0aec49bec062a46c230288250f3 --- /dev/null +++ b/mlp_out_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_19_width_262k_l0_big/config.json b/mlp_out_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a0d66532fed9ed8ccf27aed5102996035806864 --- /dev/null +++ b/mlp_out_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_1_width_262k_l0_big/config.json b/mlp_out_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b72833adfecd7264b0877248c1fcb950387a609b --- /dev/null +++ b/mlp_out_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_16k_l0_small/config.json b/mlp_out_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c41c138a57d7e7194755f834bd80f8d7bca14890 --- /dev/null +++ b/mlp_out_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_16k_l0_big/config.json b/resid_post_all/layer_0_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9f66f89d4bce2ddccca45d0d2e4eb7cd135f5a02 --- /dev/null +++ b/resid_post_all/layer_0_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_16k_l0_small/config.json b/resid_post_all/layer_0_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..432e91335ecf6d8b593fa00995a17b25cdb45af8 --- /dev/null +++ b/resid_post_all/layer_0_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_262k_l0_big/config.json b/resid_post_all/layer_0_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..169a3ae5f89cc0c88f471c788ebec3ce18162abe --- /dev/null +++ b/resid_post_all/layer_0_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_262k_l0_small/config.json b/resid_post_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..34755b4e6f9ab224954735b2f870b64db2ae2931 --- /dev/null +++ b/resid_post_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_16k_l0_big/config.json b/resid_post_all/layer_10_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..93befa6104379c07921c31161ee549b6751f0b9a --- /dev/null +++ b/resid_post_all/layer_10_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_16k_l0_small/config.json b/resid_post_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..db5d0d2eaae710caec23804d37bf36174913f224 --- /dev/null +++ b/resid_post_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_262k_l0_big/config.json b/resid_post_all/layer_10_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..021183aa7d251f3cf4f75f497d81f09939b500a2 --- /dev/null +++ b/resid_post_all/layer_10_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_16k_l0_big/config.json b/resid_post_all/layer_11_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..42e9d5f88a60acb72eea26d4292d3c8b24d8daba --- /dev/null +++ b/resid_post_all/layer_11_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_16k_l0_small/config.json b/resid_post_all/layer_11_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..46591fd46d723e0c16d9578783c2ef6d825c48e1 --- /dev/null +++ b/resid_post_all/layer_11_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_262k_l0_big/config.json b/resid_post_all/layer_11_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0dae0d43276533408991629423e07eb12989168c --- /dev/null +++ b/resid_post_all/layer_11_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_262k_l0_small/config.json b/resid_post_all/layer_11_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2f02767a1b53a33aea63a51634ed618ac0fd7870 --- /dev/null +++ b/resid_post_all/layer_11_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_16k_l0_small/config.json b/resid_post_all/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8cab39dbec7c5c224e8faff23529ab6de9ca63af --- /dev/null +++ b/resid_post_all/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_262k_l0_small/config.json b/resid_post_all/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..36e9582a3371be6fd6e2c4d884d2864134ab9e8e --- /dev/null +++ b/resid_post_all/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_16k_l0_big/config.json b/resid_post_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e2abb444838caaa7beb7dcb27e59e891bf8867f8 --- /dev/null +++ b/resid_post_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_16k_l0_small/config.json b/resid_post_all/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f38f0dff18921d9c05468979d3d032198a68d8a0 --- /dev/null +++ b/resid_post_all/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_262k_l0_small/config.json b/resid_post_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..55bca74fd31aa968cc66185590aac08611417ca6 --- /dev/null +++ b/resid_post_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_16k_l0_big/config.json b/resid_post_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ff562d21684ec249455dff710e57c44828a6fd3f --- /dev/null +++ b/resid_post_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_16k_l0_small/config.json b/resid_post_all/layer_14_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6d3ba87886b9812781c236ae7823f8beeeaaa573 --- /dev/null +++ b/resid_post_all/layer_14_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_262k_l0_big/config.json b/resid_post_all/layer_14_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d20f685b3f712c8ca91a1c9608bc72592caa88c8 --- /dev/null +++ b/resid_post_all/layer_14_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_262k_l0_small/config.json b/resid_post_all/layer_14_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2cbf650b743ae4e695a454b2069e9146a596049d --- /dev/null +++ b/resid_post_all/layer_14_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_16k_l0_big/config.json b/resid_post_all/layer_15_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..efddf2f1ea6adfcdf0ac046d027d0f7008dc53b9 --- /dev/null +++ b/resid_post_all/layer_15_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_16k_l0_small/config.json b/resid_post_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..38deae0930e20d825824e2760c0c6209131a0b32 --- /dev/null +++ b/resid_post_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_262k_l0_big/config.json b/resid_post_all/layer_15_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f52d09558b05434784d90c826a7ccd28151d63b4 --- /dev/null +++ b/resid_post_all/layer_15_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_16k_l0_big/config.json b/resid_post_all/layer_16_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b4bb019473b59f7f003c503d4321e5bb6d3ca205 --- /dev/null +++ b/resid_post_all/layer_16_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_16k_l0_small/config.json b/resid_post_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8a460ccae5871f4556bf60c131de878d93f7a42f --- /dev/null +++ b/resid_post_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_262k_l0_big/config.json b/resid_post_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..65f55afe1f9307bd6a471e56cb68064752d1288b --- /dev/null +++ b/resid_post_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_16k_l0_big/config.json b/resid_post_all/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c611cdbb5ca8a8570a1da64019615d3caee3bd38 --- /dev/null +++ b/resid_post_all/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_16k_l0_small/config.json b/resid_post_all/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb69837ce3e6bd95b16a1c42a101b73f71828152 --- /dev/null +++ b/resid_post_all/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_262k_l0_big/config.json b/resid_post_all/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a1ea97fb24c63e98db05f1c6ec97bf494c35cb5a --- /dev/null +++ b/resid_post_all/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_262k_l0_small/config.json b/resid_post_all/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f02c05a9118efeb73ba22f7a2a23f6dad51b7f87 --- /dev/null +++ b/resid_post_all/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_16k_l0_big/config.json b/resid_post_all/layer_18_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..97d8ba13b758858b7fa1806e417d85671308ecc6 --- /dev/null +++ b/resid_post_all/layer_18_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_16k_l0_small/config.json b/resid_post_all/layer_18_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..99149309745cd74ffc9b1bc77b89da90ccd27d73 --- /dev/null +++ b/resid_post_all/layer_18_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_262k_l0_small/config.json b/resid_post_all/layer_18_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6d676817bbae1f04835a6367e2d02c1dd19b6a4a --- /dev/null +++ b/resid_post_all/layer_18_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_16k_l0_big/config.json b/resid_post_all/layer_19_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1a20b92eed4278f8dedee306f37751574c44e0be --- /dev/null +++ b/resid_post_all/layer_19_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_16k_l0_small/config.json b/resid_post_all/layer_19_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..80907de5d05e9f45d810f09282e9940c4f4148a7 --- /dev/null +++ b/resid_post_all/layer_19_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_262k_l0_big/config.json b/resid_post_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ea2cbb26b2bf5750b05ece1b030d66771ca6eef --- /dev/null +++ b/resid_post_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_16k_l0_big/config.json b/resid_post_all/layer_1_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cccb46b1bea86aeb841e847d65497a8a212f4c1b --- /dev/null +++ b/resid_post_all/layer_1_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_16k_l0_small/config.json b/resid_post_all/layer_1_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4f1a601bf6956d37b31eaa893e163f9c132a0403 --- /dev/null +++ b/resid_post_all/layer_1_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_262k_l0_big/config.json b/resid_post_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7974448bf4bbfe1562c616e8071354cce9ede14b --- /dev/null +++ b/resid_post_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_16k_l0_big/config.json b/resid_post_all/layer_20_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..64f7b6099e570d65eb7f0479d08a29d9ebc47db0 --- /dev/null +++ b/resid_post_all/layer_20_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_16k_l0_small/config.json b/resid_post_all/layer_20_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0f8ca6ac362914d7b014339a4deb1f3e19a2253d --- /dev/null +++ b/resid_post_all/layer_20_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_262k_l0_big/config.json b/resid_post_all/layer_20_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a26f439931fae44e5f02ef94d87618501ad2578d --- /dev/null +++ b/resid_post_all/layer_20_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_16k_l0_big/config.json b/resid_post_all/layer_21_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fc8ad1e5bb3d9f9621e7fb545c0f39fd2ced0197 --- /dev/null +++ b/resid_post_all/layer_21_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_16k_l0_small/config.json b/resid_post_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..038e99bba97ab59dbd115fdc26285a4e931832bd --- /dev/null +++ b/resid_post_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_262k_l0_big/config.json b/resid_post_all/layer_21_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..365fbede545e2f2ea83b1dde312f5a40bd73bf0b --- /dev/null +++ b/resid_post_all/layer_21_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_262k_l0_small/config.json b/resid_post_all/layer_21_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2401559c9d81d2bfe3dbf72a70a56aaabf40c922 --- /dev/null +++ b/resid_post_all/layer_21_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_16k_l0_big/config.json b/resid_post_all/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bbac5d15e3380fddb1e9610a1a243da2eb1c3d39 --- /dev/null +++ b/resid_post_all/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_16k_l0_small/config.json b/resid_post_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cf8b5ed96798de5bc53429174e0f87df3af7499c --- /dev/null +++ b/resid_post_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_262k_l0_big/config.json b/resid_post_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..348859956b8c9cd75ef8807181b9d57e5843d4f2 --- /dev/null +++ b/resid_post_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_16k_l0_small/config.json b/resid_post_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3c84cfbba6c1d3cf8149cd137fcf2e827b5e0606 --- /dev/null +++ b/resid_post_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_262k_l0_big/config.json b/resid_post_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c0e79077ff9303b407d1afcac6f42e9ef61c5b4f --- /dev/null +++ b/resid_post_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_262k_l0_small/config.json b/resid_post_all/layer_23_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..93f41e01c01d9ed15dd0f28ac64681f3ad2976f9 --- /dev/null +++ b/resid_post_all/layer_23_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_16k_l0_big/config.json b/resid_post_all/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dd2651fba85820afe3ba533bc6b30409d618e038 --- /dev/null +++ b/resid_post_all/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_16k_l0_small/config.json b/resid_post_all/layer_24_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a9c186d1a8ad360ffeb0ab7cf6ab50765846ab06 --- /dev/null +++ b/resid_post_all/layer_24_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_262k_l0_big/config.json b/resid_post_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ef30beaf605f7c7202f2ded7566f3ee50c6467a --- /dev/null +++ b/resid_post_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_16k_l0_small/config.json b/resid_post_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8af7d0528bf05093f93ba60c68091a527484b780 --- /dev/null +++ b/resid_post_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_262k_l0_big/config.json b/resid_post_all/layer_25_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b639d673647db6bc37fdf196356d3967ce22da73 --- /dev/null +++ b/resid_post_all/layer_25_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_262k_l0_small/config.json b/resid_post_all/layer_25_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dc8ff17c759af114fc19de6e8bf31a616aae2b2b --- /dev/null +++ b/resid_post_all/layer_25_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_16k_l0_big/config.json b/resid_post_all/layer_2_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6bcf3d503d3c331b949269843ac69516a52716e2 --- /dev/null +++ b/resid_post_all/layer_2_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_16k_l0_small/config.json b/resid_post_all/layer_2_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c26e7e3a825eec5060a63cecf4ccb8b6dce1aa3c --- /dev/null +++ b/resid_post_all/layer_2_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_262k_l0_big/config.json b/resid_post_all/layer_2_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..94b06ea24ea43af1822ca444949297fae2f8f15b --- /dev/null +++ b/resid_post_all/layer_2_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_262k_l0_small/config.json b/resid_post_all/layer_2_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..220ac9fe59c103d4e134fa2b19acaa11a8c4f514 --- /dev/null +++ b/resid_post_all/layer_2_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_16k_l0_big/config.json b/resid_post_all/layer_3_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5336320b1dc9d5ff3db450b9b17c6b16f1802872 --- /dev/null +++ b/resid_post_all/layer_3_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_16k_l0_small/config.json b/resid_post_all/layer_3_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6311cdaa55e7e51ad4f37dfcbca01146f42fcd4f --- /dev/null +++ b/resid_post_all/layer_3_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_262k_l0_small/config.json b/resid_post_all/layer_3_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8924bf7b1b442a654684143dcb145bbd80890b11 --- /dev/null +++ b/resid_post_all/layer_3_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_16k_l0_big/config.json b/resid_post_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..177a324993683a86d26e0f927189bcdcf53a265b --- /dev/null +++ b/resid_post_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_262k_l0_big/config.json b/resid_post_all/layer_4_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..31d11ec56da695dbddc2a9887c8ca8223efe825f --- /dev/null +++ b/resid_post_all/layer_4_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_262k_l0_small/config.json b/resid_post_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e278d1d7fc35c29da139a13a2a3033f782770abd --- /dev/null +++ b/resid_post_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_16k_l0_big/config.json b/resid_post_all/layer_5_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2627e9e78ba0915179f052c6beda5e020e6a70c5 --- /dev/null +++ b/resid_post_all/layer_5_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_16k_l0_small/config.json b/resid_post_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..88aed33f3ad2a68ef27ba60c4a4aff987f229113 --- /dev/null +++ b/resid_post_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_262k_l0_big/config.json b/resid_post_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3fd9cef3828a3ed7fef95aed0d08624b05489d10 --- /dev/null +++ b/resid_post_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_262k_l0_small/config.json b/resid_post_all/layer_5_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..86ae383db73419ebc5d7c92fbdf016265d4bc058 --- /dev/null +++ b/resid_post_all/layer_5_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_16k_l0_big/config.json b/resid_post_all/layer_6_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6ed8e01e0bf8f51b72367771041f40fbea19f7a3 --- /dev/null +++ b/resid_post_all/layer_6_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_262k_l0_big/config.json b/resid_post_all/layer_6_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6db77f6748cc51c426475f97688b0ec5d833b057 --- /dev/null +++ b/resid_post_all/layer_6_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_262k_l0_small/config.json b/resid_post_all/layer_6_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2008ceba8841bd88aa59210264b4676fac313c4d --- /dev/null +++ b/resid_post_all/layer_6_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_262k_l0_small/config.json b/resid_post_all/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8b3d7a8647cff84b252dc41d183b25474594e9dc --- /dev/null +++ b/resid_post_all/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_16k_l0_big/config.json b/resid_post_all/layer_8_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4a1f391220b7d3c71f345d8b81cac7405f7452e5 --- /dev/null +++ b/resid_post_all/layer_8_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_16k_l0_small/config.json b/resid_post_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4e19afa9aecae5e63869d58ab39045486769274b --- /dev/null +++ b/resid_post_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_16k_l0_big/config.json b/resid_post_all/layer_9_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bc8a296be3aa6833b42f2e852bf61ad1b968956b --- /dev/null +++ b/resid_post_all/layer_9_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_16k_l0_small/config.json b/resid_post_all/layer_9_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8dd1cb82a177c860feb07d4112831e6efa07d1e4 --- /dev/null +++ b/resid_post_all/layer_9_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_262k_l0_big/config.json b/resid_post_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..de54a7c118b5f132da1d075f3c9e7e1c88e52be7 --- /dev/null +++ b/resid_post_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_262k_l0_small/config.json b/resid_post_all/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..876e1a41173f74fa425f8fc1485bec608341345e --- /dev/null +++ b/resid_post_all/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_big/config.json b/transcoder/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b10553c85440b7ece8186ad75286682f33e20b2e --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_big_affine/config.json b/transcoder/layer_13_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e76da9791510a193fe543ac678103e51f49ac4ec --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_medium/config.json b/transcoder/layer_13_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5fac49223fd5bb2d3e84e5ebcf864195e0bea47f --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_medium_affine/config.json b/transcoder/layer_13_width_16k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ab9f5fe14209013c42446a29be9d174798451e3a --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_small/config.json b/transcoder/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..609dc0b3d134bfcd8cffeda85c5062937d072f71 --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_small_affine/config.json b/transcoder/layer_13_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d7dd78dff6af674dc65dee5d371adf3e37ada304 --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_262k_l0_big_affine/config.json b/transcoder/layer_13_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..75e22cc72a77fd7a4ec6a8bca93fb5de6bd5baec --- /dev/null +++ b/transcoder/layer_13_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_262k_l0_small_affine/config.json b/transcoder/layer_13_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6aeabbd52e78b9637d4531eed4fb64966b989987 --- /dev/null +++ b/transcoder/layer_13_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_big_affine/config.json b/transcoder/layer_13_width_65k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4487588be8e995dab557134e434216f51f299b89 --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_medium/config.json b/transcoder/layer_13_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f351689c34e76736d8f961b02051f46cc0e9966f --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_medium_affine/config.json b/transcoder/layer_13_width_65k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ff45aba6acbc3319f7514fbdbac8166d927bd824 --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_small/config.json b/transcoder/layer_13_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c4bf23ae0b50cc5afee7a2ac16e4f2349d6d2d85 --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_big/config.json b/transcoder/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..246e845c632e978224fef5860bd6f8e050306b98 --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_big_affine/config.json b/transcoder/layer_17_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1d683c0797956a48b155b51fc7ead48e0ab0cb2e --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_medium/config.json b/transcoder/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c04f004b72e4b3ccffb2b39da37490471b7198db --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_big/config.json b/transcoder/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b0dfcb75be8d24dd32a0f6edd86f38804fd2db0b --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_big_affine/config.json b/transcoder/layer_17_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e41ff24df2d2cd2d617b195a9d4be3f9f37eb35b --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_small/config.json b/transcoder/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b310c6a8d7b84f67d719a2511fb285e996caa37b --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_small_affine/config.json b/transcoder/layer_17_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7dd0d13cfc778fced37e2b9f6aeb5732bf1db8cd --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_65k_l0_small/config.json b/transcoder/layer_17_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4e450884bbefb9cd4ea578bfa9434f5e8e39ef24 --- /dev/null +++ b/transcoder/layer_17_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_65k_l0_small_affine/config.json b/transcoder/layer_17_width_65k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0c984d99279a818330a44dcb4e8a68aaa16b0db3 --- /dev/null +++ b/transcoder/layer_17_width_65k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_big/config.json b/transcoder/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..baa6f9a2c80888e0df6b7c5702d3e178e7765b1d --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_big_affine/config.json b/transcoder/layer_22_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ae3d31010d1c6c617754b2939840be59cbf7304d --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_medium/config.json b/transcoder/layer_22_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..82a3741afa0818266b9a5dc7bc90012badffdae6 --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_small/config.json b/transcoder/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3e062af5a2532f0e8132e881710f147d80261381 --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_big/config.json b/transcoder/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..58fcbf4045b8d8483126a5ff4f69ed0f777a5dc0 --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_medium/config.json b/transcoder/layer_22_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..96cac5f7587fcc46c63b89bc11bbe5fac7fb55b0 --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_small_affine/config.json b/transcoder/layer_22_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d2fa14451a9912f451e5add06446688e7a89fc30 --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_big/config.json b/transcoder/layer_22_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..36b29186a65c448908ba1d6f7365b052b4353356 --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_big_affine/config.json b/transcoder/layer_22_width_65k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0acacaf3e0ef5b727385f4ff648b24e9d50ee4f --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_medium/config.json b/transcoder/layer_22_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..45e4ccd8387c3927e748f8412f2f7682bdcbe949 --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_small/config.json b/transcoder/layer_22_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9edd3060621ec237fccfb94dedd2de052b314feb --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_small_affine/config.json b/transcoder/layer_22_width_65k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..264716a9e154b1be5d08e09e511e834d9536d37f --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_big/config.json b/transcoder/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a94ae0ab2944acfd7787ac70b322c63a86e2198 --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_big_affine/config.json b/transcoder/layer_7_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..65011ac76331cd3b6e1ab95b0bc30bcb9e6d92d4 --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_small_affine/config.json b/transcoder/layer_7_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..537ffba7911d5b095604b110c4781c81878397a0 --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_big/config.json b/transcoder/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8f8b91fa2fc23e1fa377142e8b6df0fbacc23f7e --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_big_affine/config.json b/transcoder/layer_7_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7b0e7a9bd8c6bbe903890ea087873c3e276348f0 --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_medium_affine/config.json b/transcoder/layer_7_width_262k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..55c03912715a1daf7dc21465ff2db134e5e8c75b --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_small/config.json b/transcoder/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1fb4f99bf47a3b3c91c6c6243b2a8b25840e63b5 --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_small_affine/config.json b/transcoder/layer_7_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3d22e49d51a03efa3e3b7c79a871ffd62b088d69 --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_big_affine/config.json b/transcoder/layer_7_width_65k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..271b88bb8c2ae3951a00a611d63e3272d66d3213 --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_medium_affine/config.json b/transcoder/layer_7_width_65k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e16ce1b7dddeb778589daaccb912ac0442ec0516 --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_small/config.json b/transcoder/layer_7_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c6b05c468d2bfb3fee4bbdf41449b3b15de3de13 --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_small_affine/config.json b/transcoder/layer_7_width_65k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ea9190d396719e55fc6378cee2b42698e2768fea --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file