diff --git a/attn_out/layer_13_width_16k_l0_big/config.json b/attn_out/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9ae271298282819b3a20ad4c07e69176c7489225 --- /dev/null +++ b/attn_out/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_13_width_16k_l0_medium/config.json b/attn_out/layer_13_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..981b3b9bf7fffed9bee947bbaf5e3ad3f7bfa65d --- /dev/null +++ b/attn_out/layer_13_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_13_width_16k_l0_small/config.json b/attn_out/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..500846b0d33a5519a621d47139e78ec31ebd5bb9 --- /dev/null +++ b/attn_out/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_13_width_262k_l0_big/config.json b/attn_out/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..244459e8e4ab695f1677467a86c853ed94daca49 --- /dev/null +++ b/attn_out/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_13_width_262k_l0_medium/config.json b/attn_out/layer_13_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..960602807cc2e8e924de7e7ff2fb0a43c890facd --- /dev/null +++ b/attn_out/layer_13_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_13_width_262k_l0_small/config.json b/attn_out/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ce6dccee30bedf38049b62efc9cbe958ea714bdf --- /dev/null +++ b/attn_out/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_13_width_65k_l0_big/config.json b/attn_out/layer_13_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cf6622b37559cd422e89cd2aa24f677b369f8a70 --- /dev/null +++ b/attn_out/layer_13_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_13_width_65k_l0_medium/config.json b/attn_out/layer_13_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..778c7c6c256243f7a5f3e6144ce9b3625cbf4d61 --- /dev/null +++ b/attn_out/layer_13_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_13_width_65k_l0_small/config.json b/attn_out/layer_13_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..346580f3171c80cd631ad17c2877e2e0fd95e52f --- /dev/null +++ b/attn_out/layer_13_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_16k_l0_big/config.json b/attn_out/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..46df263c6c0814f42a4ada8b845aa3894f76758e --- /dev/null +++ b/attn_out/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_16k_l0_medium/config.json b/attn_out/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0f21123e8836ad79c3f6315c026422cf8deb8860 --- /dev/null +++ b/attn_out/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_16k_l0_small/config.json b/attn_out/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..debf9269ec5c3e37db4542e705cae68ed9ecd53e --- /dev/null +++ b/attn_out/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_262k_l0_big/config.json b/attn_out/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d525d758c3a2144b783a5e10698577680778d91 --- /dev/null +++ b/attn_out/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_262k_l0_medium/config.json b/attn_out/layer_17_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb8ec7c011ae4558353f6095be97f376fd1b9f62 --- /dev/null +++ b/attn_out/layer_17_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_262k_l0_small/config.json b/attn_out/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9b520f313a641530cf02a45988c19fd4abb62032 --- /dev/null +++ b/attn_out/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_65k_l0_big/config.json b/attn_out/layer_17_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f9422135e5b0f4817f9a2d34c68c72a506a8590f --- /dev/null +++ b/attn_out/layer_17_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_65k_l0_medium/config.json b/attn_out/layer_17_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..56d85b1501bffcf7e8e51b3261853824f66c81e2 --- /dev/null +++ b/attn_out/layer_17_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_17_width_65k_l0_small/config.json b/attn_out/layer_17_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1ca5906375da95c01035a9f938424d56e4d172a5 --- /dev/null +++ b/attn_out/layer_17_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_16k_l0_big/config.json b/attn_out/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..145287ce14e323bee06ffed4f04ccb93f79109ea --- /dev/null +++ b/attn_out/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_16k_l0_medium/config.json b/attn_out/layer_22_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3c70e1453217c74374c34205c4f3780735c1d15c --- /dev/null +++ b/attn_out/layer_22_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_16k_l0_small/config.json b/attn_out/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec9968193bc180219026be8a00cedae6956ffbd5 --- /dev/null +++ b/attn_out/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_262k_l0_big/config.json b/attn_out/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3f4e9976c740f817150943737f16ed7d6b010a3a --- /dev/null +++ b/attn_out/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_262k_l0_medium/config.json b/attn_out/layer_22_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ced504ce91aec2547c7f89a75dd6c9d5ef3d3a50 --- /dev/null +++ b/attn_out/layer_22_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_262k_l0_small/config.json b/attn_out/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bdae94c55c67fc947a77b8999adc477d0ff1115d --- /dev/null +++ b/attn_out/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_65k_l0_big/config.json b/attn_out/layer_22_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e175297980d257d755b82243e0e1ae1e931a1777 --- /dev/null +++ b/attn_out/layer_22_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_65k_l0_medium/config.json b/attn_out/layer_22_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b184bf36c9132eb5af1c3d6f277642e0695dcce8 --- /dev/null +++ b/attn_out/layer_22_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_22_width_65k_l0_small/config.json b/attn_out/layer_22_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca2536f79cbf187e341ab80280dc63d6ced8cda8 --- /dev/null +++ b/attn_out/layer_22_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_16k_l0_big/config.json b/attn_out/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c4b4cce06a87a51192ebbd016d3e3f37aaa4d34c --- /dev/null +++ b/attn_out/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_16k_l0_medium/config.json b/attn_out/layer_7_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a27c6b0a6a3360518f9c5fa87904b138ffe5781d --- /dev/null +++ b/attn_out/layer_7_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_16k_l0_small/config.json b/attn_out/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f4c6f95541f803539e40c3ee0849e489f79d5494 --- /dev/null +++ b/attn_out/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_262k_l0_big/config.json b/attn_out/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..28b61641937e651c97e543c8605deaac67466929 --- /dev/null +++ b/attn_out/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_262k_l0_medium/config.json b/attn_out/layer_7_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bb6ea8a826aea078cca4f895d553f0c990e566d5 --- /dev/null +++ b/attn_out/layer_7_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_262k_l0_small/config.json b/attn_out/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5c8838e51473d06c1e1837829cbc61fbfc01eba --- /dev/null +++ b/attn_out/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_65k_l0_big/config.json b/attn_out/layer_7_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..989b453aed778841f25297a6ed98f4f3928f84ff --- /dev/null +++ b/attn_out/layer_7_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_65k_l0_medium/config.json b/attn_out/layer_7_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eccb27231051ab6b56c6512df6a6ae53840e76c5 --- /dev/null +++ b/attn_out/layer_7_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out/layer_7_width_65k_l0_small/config.json b/attn_out/layer_7_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..361a465133442f8dec30afd0520280134887ded5 --- /dev/null +++ b/attn_out/layer_7_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_0_width_16k_l0_big/config.json b/attn_out_all/layer_0_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca2ac3d6ed50f88d96c6928681d42e4557759cfd --- /dev/null +++ b/attn_out_all/layer_0_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.0.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_0_width_16k_l0_small/config.json b/attn_out_all/layer_0_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..47b70b920c00e33df23f85edb8b5be509a93c954 --- /dev/null +++ b/attn_out_all/layer_0_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.0.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_0_width_262k_l0_big/config.json b/attn_out_all/layer_0_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2fd40566b913f866a5d9316d4e8a3d8793145f88 --- /dev/null +++ b/attn_out_all/layer_0_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.0.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_0_width_262k_l0_small/config.json b/attn_out_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0b0ffcef791e010882c8a3938d28170af8fbbab0 --- /dev/null +++ b/attn_out_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.0.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_10_width_16k_l0_big/config.json b/attn_out_all/layer_10_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..82ee04aa357a7c6b824ddf752aafa275615f117e --- /dev/null +++ b/attn_out_all/layer_10_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.10.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_10_width_16k_l0_small/config.json b/attn_out_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c391556aee01a699beb7d7e5808206a44caba05a --- /dev/null +++ b/attn_out_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.10.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_10_width_262k_l0_big/config.json b/attn_out_all/layer_10_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cd29758dd231bdb12c57ba10ea2b1f72336fc1b6 --- /dev/null +++ b/attn_out_all/layer_10_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.10.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_10_width_262k_l0_small/config.json b/attn_out_all/layer_10_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e84a541d4b4b0cad8fc01c99871dad4ecbe67b8f --- /dev/null +++ b/attn_out_all/layer_10_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.10.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_11_width_16k_l0_big/config.json b/attn_out_all/layer_11_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb3b9517e2d6b8eb6a9f088a6e8480ba8777ca3e --- /dev/null +++ b/attn_out_all/layer_11_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.11.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_11_width_16k_l0_small/config.json b/attn_out_all/layer_11_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5aba501c1da96b65bc742b71a6e7b7d547070935 --- /dev/null +++ b/attn_out_all/layer_11_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.11.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_11_width_262k_l0_big/config.json b/attn_out_all/layer_11_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3914ca479db0ac7558599467f68ea0678a714117 --- /dev/null +++ b/attn_out_all/layer_11_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.11.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_11_width_262k_l0_small/config.json b/attn_out_all/layer_11_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f9a9da2a120b2fa260a2fd9aacd71d4cb3da36fe --- /dev/null +++ b/attn_out_all/layer_11_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.11.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_12_width_16k_l0_big/config.json b/attn_out_all/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..30030e7b1f98813bd40c2c17d4a23c8aadf818fa --- /dev/null +++ b/attn_out_all/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_12_width_16k_l0_small/config.json b/attn_out_all/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a60e351084ae8270c796f5182e284d8c485109cf --- /dev/null +++ b/attn_out_all/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_12_width_262k_l0_big/config.json b/attn_out_all/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0de77ca0e37f12f1a722c5518ac00fe4f023a6ba --- /dev/null +++ b/attn_out_all/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_12_width_262k_l0_small/config.json b/attn_out_all/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0535ac3e2275b83dfd598593da4baf06319a599a --- /dev/null +++ b/attn_out_all/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_13_width_16k_l0_big/config.json b/attn_out_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f978ed56e3320ba2a75f0296eede4134470c45a3 --- /dev/null +++ b/attn_out_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_13_width_16k_l0_small/config.json b/attn_out_all/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..500846b0d33a5519a621d47139e78ec31ebd5bb9 --- /dev/null +++ b/attn_out_all/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_13_width_262k_l0_big/config.json b/attn_out_all/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fda7198538f7d24f4aa2d8404e7632022b7bbe8f --- /dev/null +++ b/attn_out_all/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_13_width_262k_l0_small/config.json b/attn_out_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ce6dccee30bedf38049b62efc9cbe958ea714bdf --- /dev/null +++ b/attn_out_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_14_width_16k_l0_big/config.json b/attn_out_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5f9d4d917bb61999d213e490f2bbb93566977b08 --- /dev/null +++ b/attn_out_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.14.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_14_width_16k_l0_small/config.json b/attn_out_all/layer_14_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7b0c6ad5f832da05df950fac735139ea57d3eaab --- /dev/null +++ b/attn_out_all/layer_14_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.14.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_14_width_262k_l0_big/config.json b/attn_out_all/layer_14_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2625634509fb13ee091133e365540ceafd96e465 --- /dev/null +++ b/attn_out_all/layer_14_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.14.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_14_width_262k_l0_small/config.json b/attn_out_all/layer_14_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b003c6513083af0cfdd4e713070275619408e665 --- /dev/null +++ b/attn_out_all/layer_14_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.14.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_15_width_16k_l0_big/config.json b/attn_out_all/layer_15_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d371e5d8a30bb73f329e60cb6bd646e47fc1bb26 --- /dev/null +++ b/attn_out_all/layer_15_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_15_width_16k_l0_small/config.json b/attn_out_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6d490369f24c927b15d1bfdbdf1c487a6445569e --- /dev/null +++ b/attn_out_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_15_width_262k_l0_big/config.json b/attn_out_all/layer_15_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..14fe34e075a4fbf5783b51258344ebaea87e911e --- /dev/null +++ b/attn_out_all/layer_15_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_15_width_262k_l0_small/config.json b/attn_out_all/layer_15_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b4332624291695d3f14c9ad173b2cb398e33e049 --- /dev/null +++ b/attn_out_all/layer_15_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_16_width_16k_l0_big/config.json b/attn_out_all/layer_16_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e3b4fd268f828811d23a0966525c36d0568cdaa1 --- /dev/null +++ b/attn_out_all/layer_16_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.16.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_16_width_16k_l0_small/config.json b/attn_out_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7b1c8e13950c17ac224c0e08d0abe09f14ef83be --- /dev/null +++ b/attn_out_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.16.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_16_width_262k_l0_big/config.json b/attn_out_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3e9a53c1bd89137e3492fa66b0397262080050dc --- /dev/null +++ b/attn_out_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.16.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_16_width_262k_l0_small/config.json b/attn_out_all/layer_16_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7b9a931a437bbad80171a089cb4ba60c1ca8db2b --- /dev/null +++ b/attn_out_all/layer_16_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.16.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_17_width_16k_l0_big/config.json b/attn_out_all/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..012cb6bdd736619ef5de91ba235376eca45c54e1 --- /dev/null +++ b/attn_out_all/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_17_width_16k_l0_small/config.json b/attn_out_all/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..debf9269ec5c3e37db4542e705cae68ed9ecd53e --- /dev/null +++ b/attn_out_all/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_17_width_262k_l0_big/config.json b/attn_out_all/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5afd1d6d61721a5e7f92ecd977f27b74228a0c6f --- /dev/null +++ b/attn_out_all/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_17_width_262k_l0_small/config.json b/attn_out_all/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9b520f313a641530cf02a45988c19fd4abb62032 --- /dev/null +++ b/attn_out_all/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_18_width_16k_l0_big/config.json b/attn_out_all/layer_18_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cce45dbadd5c4477f887a87b292745a494acdd51 --- /dev/null +++ b/attn_out_all/layer_18_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.18.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_18_width_16k_l0_small/config.json b/attn_out_all/layer_18_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..22f53cba457b194856e23b269890880a1de8127e --- /dev/null +++ b/attn_out_all/layer_18_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.18.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_18_width_262k_l0_big/config.json b/attn_out_all/layer_18_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4b4d44e74d10572e59e5440f4f05dd83a5ee3177 --- /dev/null +++ b/attn_out_all/layer_18_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.18.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_18_width_262k_l0_small/config.json b/attn_out_all/layer_18_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..20c7022fa27bccfb217e9380d5f2dc2360ce4cf5 --- /dev/null +++ b/attn_out_all/layer_18_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.18.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_19_width_16k_l0_big/config.json b/attn_out_all/layer_19_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a33871217d6219bd568798b9ccb475e82411ea5 --- /dev/null +++ b/attn_out_all/layer_19_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.19.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_19_width_16k_l0_small/config.json b/attn_out_all/layer_19_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c63ef4bfb0fa9d8f4606476588f58cb697c76a9c --- /dev/null +++ b/attn_out_all/layer_19_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.19.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_19_width_262k_l0_big/config.json b/attn_out_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b9def85a85f41470e5fafa78aae04d7398b97f1f --- /dev/null +++ b/attn_out_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.19.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_19_width_262k_l0_small/config.json b/attn_out_all/layer_19_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bdf8f14ae28e50a7d0eae86a973c7b88e8e13fb7 --- /dev/null +++ b/attn_out_all/layer_19_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.19.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_1_width_16k_l0_big/config.json b/attn_out_all/layer_1_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4b38cdd771f11ba7e60c9620cf39c90c36c1ff8e --- /dev/null +++ b/attn_out_all/layer_1_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_1_width_16k_l0_small/config.json b/attn_out_all/layer_1_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..13e957fc58a6a52438277c6041c0667f6622a5b2 --- /dev/null +++ b/attn_out_all/layer_1_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_1_width_262k_l0_big/config.json b/attn_out_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..adabcf060e4ec61f09138beffa0b3278db02a006 --- /dev/null +++ b/attn_out_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_1_width_262k_l0_small/config.json b/attn_out_all/layer_1_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fbda872f537ddaa36a115c7517288c0f9cb46520 --- /dev/null +++ b/attn_out_all/layer_1_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_20_width_16k_l0_big/config.json b/attn_out_all/layer_20_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..89abbb9d90525305c029a0a3b07541d03c1ebb74 --- /dev/null +++ b/attn_out_all/layer_20_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.20.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_20_width_16k_l0_small/config.json b/attn_out_all/layer_20_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..960f96dc105bcfc2883f563328554a261efb4b6a --- /dev/null +++ b/attn_out_all/layer_20_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.20.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_20_width_262k_l0_big/config.json b/attn_out_all/layer_20_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aaa807be9e644b86fccbb46f032a252cefae6b42 --- /dev/null +++ b/attn_out_all/layer_20_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.20.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_20_width_262k_l0_small/config.json b/attn_out_all/layer_20_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0254ee7d14c27d6b13da6c91fb15489715d0f1d3 --- /dev/null +++ b/attn_out_all/layer_20_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.20.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_21_width_16k_l0_big/config.json b/attn_out_all/layer_21_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ed0043bda51add47ddea5b0722a2923c642b744 --- /dev/null +++ b/attn_out_all/layer_21_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.21.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_21_width_16k_l0_small/config.json b/attn_out_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0b9e40740532628bbef177263f41c829162ac0f5 --- /dev/null +++ b/attn_out_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.21.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_21_width_262k_l0_big/config.json b/attn_out_all/layer_21_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0c96a0cb8127970f2d6fb06699d9620bbf0b0d0c --- /dev/null +++ b/attn_out_all/layer_21_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.21.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_21_width_262k_l0_small/config.json b/attn_out_all/layer_21_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ebfc7467b3331a72183a1dac9db9833a4cbbb027 --- /dev/null +++ b/attn_out_all/layer_21_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.21.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_22_width_16k_l0_big/config.json b/attn_out_all/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8fe6cdaf0c1055d65a62bca4111176d71f3e5611 --- /dev/null +++ b/attn_out_all/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_22_width_16k_l0_small/config.json b/attn_out_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec9968193bc180219026be8a00cedae6956ffbd5 --- /dev/null +++ b/attn_out_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_22_width_262k_l0_big/config.json b/attn_out_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..696c0feef280e459d3b7cec55c79e8a500224214 --- /dev/null +++ b/attn_out_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_22_width_262k_l0_small/config.json b/attn_out_all/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bdae94c55c67fc947a77b8999adc477d0ff1115d --- /dev/null +++ b/attn_out_all/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_23_width_16k_l0_big/config.json b/attn_out_all/layer_23_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5950bc63837902bbbca9b515f614ba46aeae7fb4 --- /dev/null +++ b/attn_out_all/layer_23_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.23.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_23_width_16k_l0_small/config.json b/attn_out_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..afcaa55444cea05d84df52b9b5161bbd5d4e4d28 --- /dev/null +++ b/attn_out_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.23.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_23_width_262k_l0_big/config.json b/attn_out_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4c2c1a2c2f85d36c908e1fdf5cd2fa2fe74a3be6 --- /dev/null +++ b/attn_out_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.23.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_23_width_262k_l0_small/config.json b/attn_out_all/layer_23_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7b468e6f1ff7fa4ef40d34a7a6329505fa2b91fb --- /dev/null +++ b/attn_out_all/layer_23_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.23.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_24_width_16k_l0_big/config.json b/attn_out_all/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..105a439017ad6b8e123fced945ddc535d5a24f47 --- /dev/null +++ b/attn_out_all/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_24_width_16k_l0_small/config.json b/attn_out_all/layer_24_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d40de5b7fce10b6bc7e8ce9a4d5e6947f52d36fa --- /dev/null +++ b/attn_out_all/layer_24_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_24_width_262k_l0_big/config.json b/attn_out_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..566bc5400bc47b78c9bb4777a6bef5e96b6e96db --- /dev/null +++ b/attn_out_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_24_width_262k_l0_small/config.json b/attn_out_all/layer_24_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b61b975343cbae89239d1baa325693a2fb0dfc57 --- /dev/null +++ b/attn_out_all/layer_24_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_25_width_16k_l0_big/config.json b/attn_out_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb672bdbc3922b3183eaff02cd7928bae919892d --- /dev/null +++ b/attn_out_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.25.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_25_width_16k_l0_small/config.json b/attn_out_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..86ac6b3fcf07a0e640f5fb339dadcdc7bd523b36 --- /dev/null +++ b/attn_out_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.25.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_25_width_262k_l0_big/config.json b/attn_out_all/layer_25_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7133a468f262e1888a778a759f793d58d2e6793d --- /dev/null +++ b/attn_out_all/layer_25_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.25.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_25_width_262k_l0_small/config.json b/attn_out_all/layer_25_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..419e991d03812e72ccad7114b4ebfd28faf79071 --- /dev/null +++ b/attn_out_all/layer_25_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.25.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_2_width_16k_l0_big/config.json b/attn_out_all/layer_2_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fedf61adf1cd9e20006ca775510d7f0e8673106d --- /dev/null +++ b/attn_out_all/layer_2_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.2.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_2_width_16k_l0_small/config.json b/attn_out_all/layer_2_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a25af43a3c7ee9b44a8ae34cd01c6f96621d4f78 --- /dev/null +++ b/attn_out_all/layer_2_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.2.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_2_width_262k_l0_big/config.json b/attn_out_all/layer_2_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b20e4c6684ae6d2860a2fe28ebfb6bf06450ba7b --- /dev/null +++ b/attn_out_all/layer_2_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.2.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_2_width_262k_l0_small/config.json b/attn_out_all/layer_2_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ad4b7f31dbef88e8ef3aeca41cc173b55adf6623 --- /dev/null +++ b/attn_out_all/layer_2_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.2.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_3_width_16k_l0_big/config.json b/attn_out_all/layer_3_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ce85e8c8d783fdad88ec16d81fcf6729e8206db7 --- /dev/null +++ b/attn_out_all/layer_3_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.3.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_3_width_16k_l0_small/config.json b/attn_out_all/layer_3_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..513c62ce29dcdaf821a8176f3454ee678734d946 --- /dev/null +++ b/attn_out_all/layer_3_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.3.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_3_width_262k_l0_big/config.json b/attn_out_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b5cd30fae04d16df40757636e5af510367a68d0b --- /dev/null +++ b/attn_out_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.3.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_3_width_262k_l0_small/config.json b/attn_out_all/layer_3_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6caae0541211dc47bbcfc379790309c523f5f73b --- /dev/null +++ b/attn_out_all/layer_3_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.3.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_4_width_16k_l0_big/config.json b/attn_out_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a306de2dff29a9432686c1b7f38ad70c82d9137b --- /dev/null +++ b/attn_out_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.4.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_4_width_16k_l0_small/config.json b/attn_out_all/layer_4_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5db8170b91c17d1aad9a68d4d4c1f325a720ab82 --- /dev/null +++ b/attn_out_all/layer_4_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.4.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_4_width_262k_l0_big/config.json b/attn_out_all/layer_4_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..58b8c7552ebc1fe350b740298e010e8125eeb61b --- /dev/null +++ b/attn_out_all/layer_4_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.4.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_4_width_262k_l0_small/config.json b/attn_out_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5ff705eb54191ef191d94949306d5746a17954e2 --- /dev/null +++ b/attn_out_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.4.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_5_width_16k_l0_big/config.json b/attn_out_all/layer_5_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..da4add676878d91886d69baf3e2de4342587a359 --- /dev/null +++ b/attn_out_all/layer_5_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_5_width_16k_l0_small/config.json b/attn_out_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e26979f6d0a462e57529e63cfdcf43e9a0416ec6 --- /dev/null +++ b/attn_out_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_5_width_262k_l0_big/config.json b/attn_out_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ee5585b763987c64da559a968f7ef5693cad770 --- /dev/null +++ b/attn_out_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_5_width_262k_l0_small/config.json b/attn_out_all/layer_5_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d5261dd063d1533628f13077a38e8352b2f53987 --- /dev/null +++ b/attn_out_all/layer_5_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_6_width_16k_l0_big/config.json b/attn_out_all/layer_6_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5d0db8cd790af7ab8d1c40f1de7938a0c0bf5fd9 --- /dev/null +++ b/attn_out_all/layer_6_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_6_width_16k_l0_small/config.json b/attn_out_all/layer_6_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2be3162d7598ea77ec6768e21f613914dd0ef67a --- /dev/null +++ b/attn_out_all/layer_6_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_6_width_262k_l0_big/config.json b/attn_out_all/layer_6_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9a9f25e4e955e8ed3aa252ff65e0afce7e96f7d1 --- /dev/null +++ b/attn_out_all/layer_6_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_6_width_262k_l0_small/config.json b/attn_out_all/layer_6_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5ac94080d251ddc9d361f57d6fc5d53cb0a6b8da --- /dev/null +++ b/attn_out_all/layer_6_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_7_width_16k_l0_big/config.json b/attn_out_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bffbac897dc81643c120776c9b742741d10573bb --- /dev/null +++ b/attn_out_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_7_width_16k_l0_small/config.json b/attn_out_all/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f4c6f95541f803539e40c3ee0849e489f79d5494 --- /dev/null +++ b/attn_out_all/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_7_width_262k_l0_big/config.json b/attn_out_all/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1b8e7e6064902ffbb42bd2cf3c1d72b8de808e39 --- /dev/null +++ b/attn_out_all/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_7_width_262k_l0_small/config.json b/attn_out_all/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5c8838e51473d06c1e1837829cbc61fbfc01eba --- /dev/null +++ b/attn_out_all/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_8_width_16k_l0_big/config.json b/attn_out_all/layer_8_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..722fb69a797c192388df805d2cfe259e4dbe84ea --- /dev/null +++ b/attn_out_all/layer_8_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.8.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_8_width_16k_l0_small/config.json b/attn_out_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0a61feb1042c7c2bd1fa319240bdb7f31a1359a --- /dev/null +++ b/attn_out_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.8.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_8_width_262k_l0_big/config.json b/attn_out_all/layer_8_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..003bea40e0d0b17cf44b64bc626a9fdec511af1f --- /dev/null +++ b/attn_out_all/layer_8_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.8.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_8_width_262k_l0_small/config.json b/attn_out_all/layer_8_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..097f4f8cab064cc58c3f729bd974e2ab2abbc6fc --- /dev/null +++ b/attn_out_all/layer_8_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.8.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_9_width_16k_l0_big/config.json b/attn_out_all/layer_9_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..12cccd604560a9fc522b2e70763644572acfeb32 --- /dev/null +++ b/attn_out_all/layer_9_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_9_width_16k_l0_small/config.json b/attn_out_all/layer_9_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..616408bccf2cbf35f2e466d02594abad6e73a231 --- /dev/null +++ b/attn_out_all/layer_9_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_9_width_262k_l0_big/config.json b/attn_out_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7f670a1a81d7af906aecf846aeb6f6e4d0064381 --- /dev/null +++ b/attn_out_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/attn_out_all/layer_9_width_262k_l0_small/config.json b/attn_out_all/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..03970488bc5ea4660e353673bd181f20e68727b5 --- /dev/null +++ b/attn_out_all/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_16k_l0_big/config.json b/mlp_out/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6f6060e5b855cd101b1c27dd78de40ac9aec3939 --- /dev/null +++ b/mlp_out/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_16k_l0_medium/config.json b/mlp_out/layer_13_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6c00e87c5a2de3bf8fb30ce10652e4e5041b6076 --- /dev/null +++ b/mlp_out/layer_13_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_16k_l0_small/config.json b/mlp_out/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cfb09b8f5a36009100cbcce06d5d1d70321863e2 --- /dev/null +++ b/mlp_out/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_1m_l0_big/config.json b/mlp_out/layer_13_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..68dc9be6ee6160e63e392eaf52d105a6bccaabec --- /dev/null +++ b/mlp_out/layer_13_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_1m_l0_medium/config.json b/mlp_out/layer_13_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..205d74fc61c0ce750f37cfe50aafa0dee391ae9e --- /dev/null +++ b/mlp_out/layer_13_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_1m_l0_small/config.json b/mlp_out/layer_13_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9ba99322f72abc51475c5768dcccc80f98ad2ea4 --- /dev/null +++ b/mlp_out/layer_13_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_262k_l0_big/config.json b/mlp_out/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df5f1740bee7dff9be734c4a19ef07f50d3b627d --- /dev/null +++ b/mlp_out/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_262k_l0_medium/config.json b/mlp_out/layer_13_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ca1ced082da28a7fee7224b7b5a7a3db4f56bdc6 --- /dev/null +++ b/mlp_out/layer_13_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_262k_l0_small/config.json b/mlp_out/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..59081c58731fad2786d5664cc458a178a66f2337 --- /dev/null +++ b/mlp_out/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_65k_l0_big/config.json b/mlp_out/layer_13_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8b4d857d257c158b78f6ac377f0e23e6f5edcf0d --- /dev/null +++ b/mlp_out/layer_13_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_65k_l0_medium/config.json b/mlp_out/layer_13_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..be54df8311c46cfe559c7c56f2041dc336cca059 --- /dev/null +++ b/mlp_out/layer_13_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_13_width_65k_l0_small/config.json b/mlp_out/layer_13_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..caa2e14379ae8e94086debe834fe11d06be6175a --- /dev/null +++ b/mlp_out/layer_13_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_16k_l0_big/config.json b/mlp_out/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32003e6f6ec36ad4f6abdef5e6ba60236144220b --- /dev/null +++ b/mlp_out/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_16k_l0_medium/config.json b/mlp_out/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2abaa94b99192a891451ba80ac24846c042f600d --- /dev/null +++ b/mlp_out/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_16k_l0_small/config.json b/mlp_out/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..213d259462abc2c4f32a2d0a2c5a92aca9c483e3 --- /dev/null +++ b/mlp_out/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_1m_l0_big/config.json b/mlp_out/layer_17_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b1af1494e4ce859f67072cda9cabdd5be1526763 --- /dev/null +++ b/mlp_out/layer_17_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_1m_l0_medium/config.json b/mlp_out/layer_17_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a94f6bd193a3dcbe001c90f06fc7cc5ad68bc43d --- /dev/null +++ b/mlp_out/layer_17_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_1m_l0_small/config.json b/mlp_out/layer_17_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c35a949e4a6efccd5a896f04caa97ed46fb7beb1 --- /dev/null +++ b/mlp_out/layer_17_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_big/config.json b/mlp_out/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b6d761e3c303c4fbe2b9345a0a6d4fc6b0bce81d --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_medium/config.json b/mlp_out/layer_17_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..239ebdf01baad8fdeabd1ba60512560c8d99a0c3 --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_small/config.json b/mlp_out/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..46e2880f80b02566f25ecec9c993d48fb77a3157 --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_big/config.json b/mlp_out/layer_17_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..399adf1db36eb2c88afe3f9276ee0f2694ba7f59 --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_medium/config.json b/mlp_out/layer_17_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..89a3bc90373a8a47bcef6ada915c42acfd91367c --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_small/config.json b/mlp_out/layer_17_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d3da78eab9216636db73cdf48bba20609e5f5341 --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_16k_l0_big/config.json b/mlp_out/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e956903a4e8ba23594e55688e8977ffefa2a9e56 --- /dev/null +++ b/mlp_out/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_16k_l0_medium/config.json b/mlp_out/layer_22_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2abf8413433a26c9f09600ecd4d4c6974c54652f --- /dev/null +++ b/mlp_out/layer_22_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_16k_l0_small/config.json b/mlp_out/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3af3f550dc704bec0a27d83c0c79856e1cb58e39 --- /dev/null +++ b/mlp_out/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_1m_l0_big/config.json b/mlp_out/layer_22_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..68833f611010f8ecba64afa0e215806f7841477f --- /dev/null +++ b/mlp_out/layer_22_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_1m_l0_medium/config.json b/mlp_out/layer_22_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..560a543c6846117dbd12517a790ffd0fde0765ed --- /dev/null +++ b/mlp_out/layer_22_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_1m_l0_small/config.json b/mlp_out/layer_22_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7e86b43526641d4cd664b6e9cc6f8fa503b8fba9 --- /dev/null +++ b/mlp_out/layer_22_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_big/config.json b/mlp_out/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0035677b04b19ad2607b1ed1ee477645b3a7e996 --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_medium/config.json b/mlp_out/layer_22_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aaab8b254e16c949a1b01c17fcc4538f75202a76 --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_small/config.json b/mlp_out/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5dbafe6796045f4e47f31a9048267109e52b89f0 --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_big/config.json b/mlp_out/layer_22_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7ffd14221ef8c8ae158869859beed343641913f6 --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_medium/config.json b/mlp_out/layer_22_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d4f1ef44aae53125843ef27f887788b437926ff2 --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_small/config.json b/mlp_out/layer_22_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..63a948e6a382351b1a52b90d714a36dcec71b2d5 --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_16k_l0_big/config.json b/mlp_out/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5763d66c213a242099f3b02ff16cbb9bbcd9ad2a --- /dev/null +++ b/mlp_out/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_16k_l0_medium/config.json b/mlp_out/layer_7_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..51d786fbdaa17e3131c1659fc9b679121751a63c --- /dev/null +++ b/mlp_out/layer_7_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_16k_l0_small/config.json b/mlp_out/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2f9959e039d841a84029869d51ed12003e527307 --- /dev/null +++ b/mlp_out/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_1m_l0_big/config.json b/mlp_out/layer_7_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c802bf4504461eda43d8ee5414ba38bc347bc6c --- /dev/null +++ b/mlp_out/layer_7_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_1m_l0_medium/config.json b/mlp_out/layer_7_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2946d161efe8362d9cef154391169691e3805469 --- /dev/null +++ b/mlp_out/layer_7_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_1m_l0_small/config.json b/mlp_out/layer_7_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32080468dbe62b4cb3dc9d139061f28a49bbb115 --- /dev/null +++ b/mlp_out/layer_7_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_262k_l0_big/config.json b/mlp_out/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2cf256bac61d94bac2a86d6937fa029f14d9eb7f --- /dev/null +++ b/mlp_out/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_262k_l0_medium/config.json b/mlp_out/layer_7_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..734f42e59f3372d8683b2ba0954038da39505252 --- /dev/null +++ b/mlp_out/layer_7_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_262k_l0_small/config.json b/mlp_out/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fed01af8747d2606e52c10ed0df3aa4e2414edff --- /dev/null +++ b/mlp_out/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_65k_l0_big/config.json b/mlp_out/layer_7_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7d3864ffe79359907aad86e75f801365461a7823 --- /dev/null +++ b/mlp_out/layer_7_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_65k_l0_medium/config.json b/mlp_out/layer_7_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4ed26e7b31ad56634f756c662136d77ae243de0f --- /dev/null +++ b/mlp_out/layer_7_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_7_width_65k_l0_small/config.json b/mlp_out/layer_7_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d08f98742de17ae63d7cd3d6b63ae0cfc598433e --- /dev/null +++ b/mlp_out/layer_7_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_16k_l0_big/config.json b/mlp_out_all/layer_0_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..25534559f0e0876845d4efcddd84fa58c47ecddd --- /dev/null +++ b/mlp_out_all/layer_0_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_16k_l0_small/config.json b/mlp_out_all/layer_0_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0bebe13649da8824635144b3e9961f0c371a6742 --- /dev/null +++ b/mlp_out_all/layer_0_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_262k_l0_big/config.json b/mlp_out_all/layer_0_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..57be46f4138037b76295e1d0c3db86e4577f1710 --- /dev/null +++ b/mlp_out_all/layer_0_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_262k_l0_small/config.json b/mlp_out_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eaa31604ea199b81c8ff6a8e5146cfac8df78525 --- /dev/null +++ b/mlp_out_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_16k_l0_big/config.json b/mlp_out_all/layer_10_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9b29bb4f83c1fa4e64d2a53c0216667c6c6f82a8 --- /dev/null +++ b/mlp_out_all/layer_10_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_16k_l0_small/config.json b/mlp_out_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cbb6011b70f238621a81b4107b4f92cda81536e8 --- /dev/null +++ b/mlp_out_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_262k_l0_big/config.json b/mlp_out_all/layer_10_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d3c2694c0fe1cbc6ee8aea9e69ee02c4a3a08b58 --- /dev/null +++ b/mlp_out_all/layer_10_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_262k_l0_small/config.json b/mlp_out_all/layer_10_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e60f1884e70671952a4e3c49822b574316961be7 --- /dev/null +++ b/mlp_out_all/layer_10_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_16k_l0_big/config.json b/mlp_out_all/layer_11_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..16152e6c88490f7e112217a7af179074066fa93b --- /dev/null +++ b/mlp_out_all/layer_11_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_16k_l0_small/config.json b/mlp_out_all/layer_11_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c58ffe96eeaf0f8024eb1261aaa95154c821f6ed --- /dev/null +++ b/mlp_out_all/layer_11_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_262k_l0_big/config.json b/mlp_out_all/layer_11_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d85e62989697b07089449127f193c99433d548ef --- /dev/null +++ b/mlp_out_all/layer_11_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_262k_l0_small/config.json b/mlp_out_all/layer_11_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7ee68c5c960096dd10b8a4354da6558e85e135bf --- /dev/null +++ b/mlp_out_all/layer_11_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_16k_l0_big/config.json b/mlp_out_all/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5e8da17d4bd00d508f0127794d2984b79e95087a --- /dev/null +++ b/mlp_out_all/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_16k_l0_small/config.json b/mlp_out_all/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9528d9dde78fbefc0ae36000b5f102f470f98a4b --- /dev/null +++ b/mlp_out_all/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_262k_l0_big/config.json b/mlp_out_all/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c953d89afc57503cd79574df996a04f1c537380f --- /dev/null +++ b/mlp_out_all/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_262k_l0_small/config.json b/mlp_out_all/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b43d94bf33c527c7537a8f3bd79c172d9dc07e9d --- /dev/null +++ b/mlp_out_all/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_16k_l0_big/config.json b/mlp_out_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e4a08eeb57982601f42eaf9159e8bc34aa9ffbad --- /dev/null +++ b/mlp_out_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_16k_l0_small/config.json b/mlp_out_all/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cfb09b8f5a36009100cbcce06d5d1d70321863e2 --- /dev/null +++ b/mlp_out_all/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_262k_l0_big/config.json b/mlp_out_all/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0f7f37e8871683078c7d42432612c1dd4c61a3c3 --- /dev/null +++ b/mlp_out_all/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_262k_l0_small/config.json b/mlp_out_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..59081c58731fad2786d5664cc458a178a66f2337 --- /dev/null +++ b/mlp_out_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_16k_l0_big/config.json b/mlp_out_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d51b15a7a27f91a73e16e0c449e02f6970057a5d --- /dev/null +++ b/mlp_out_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_16k_l0_small/config.json b/mlp_out_all/layer_14_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bbfd7c78948b7ccf73c414030b1d01931d1e96dd --- /dev/null +++ b/mlp_out_all/layer_14_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_262k_l0_big/config.json b/mlp_out_all/layer_14_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..192045b49fd62d0ca036568fbf81bc3f09052d4c --- /dev/null +++ b/mlp_out_all/layer_14_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_262k_l0_small/config.json b/mlp_out_all/layer_14_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..74f1580b35a288d948638b5ee567ea2bfae4b5d5 --- /dev/null +++ b/mlp_out_all/layer_14_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_16k_l0_big/config.json b/mlp_out_all/layer_15_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b3f457ed44919d588171488a67dca18bd2591f49 --- /dev/null +++ b/mlp_out_all/layer_15_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_16k_l0_small/config.json b/mlp_out_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f7730001201c2947198efc7be5f99ca99ecbee16 --- /dev/null +++ b/mlp_out_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_262k_l0_big/config.json b/mlp_out_all/layer_15_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d4d7a2fc980736b0891b7d46670cb6c87721b93 --- /dev/null +++ b/mlp_out_all/layer_15_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_262k_l0_small/config.json b/mlp_out_all/layer_15_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e1b395172affe23ac53234558c4557e33ef4ab76 --- /dev/null +++ b/mlp_out_all/layer_15_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_16k_l0_big/config.json b/mlp_out_all/layer_16_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2a5a20a1605678a53b90d05c137177b539c6449d --- /dev/null +++ b/mlp_out_all/layer_16_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_16k_l0_small/config.json b/mlp_out_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9e3a27be735d54cb785be9ba3d94220b6e944c44 --- /dev/null +++ b/mlp_out_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_262k_l0_big/config.json b/mlp_out_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3f3455acdd5d2430679930408a3fcd32dbcc7f6a --- /dev/null +++ b/mlp_out_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_262k_l0_small/config.json b/mlp_out_all/layer_16_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fe73155db25a54ab40b843e019b701a0f7e6aa61 --- /dev/null +++ b/mlp_out_all/layer_16_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_16k_l0_big/config.json b/mlp_out_all/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e2b9a0a125a2b68d056d9452d0f9649707d2f33c --- /dev/null +++ b/mlp_out_all/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_16k_l0_small/config.json b/mlp_out_all/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..213d259462abc2c4f32a2d0a2c5a92aca9c483e3 --- /dev/null +++ b/mlp_out_all/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_big/config.json b/mlp_out_all/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8a1726030d5b154a274aff8675e4244b26a0f36b --- /dev/null +++ b/mlp_out_all/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_small/config.json b/mlp_out_all/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..46e2880f80b02566f25ecec9c993d48fb77a3157 --- /dev/null +++ b/mlp_out_all/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_18_width_16k_l0_big/config.json b/mlp_out_all/layer_18_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..014c98440ac78081b08eddb8b23c7a0a82101478 --- /dev/null +++ b/mlp_out_all/layer_18_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_18_width_16k_l0_small/config.json b/mlp_out_all/layer_18_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e8940a52a2ec283061a34a44241b15bedb77e63f --- /dev/null +++ b/mlp_out_all/layer_18_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_18_width_262k_l0_big/config.json b/mlp_out_all/layer_18_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a80dd8d6620fb65dfd4c6b10e179ee78db28f29e --- /dev/null +++ b/mlp_out_all/layer_18_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_18_width_262k_l0_small/config.json b/mlp_out_all/layer_18_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4f5a33643ee492256c62b0312aebee9bf6fa13d2 --- /dev/null +++ b/mlp_out_all/layer_18_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_19_width_16k_l0_big/config.json b/mlp_out_all/layer_19_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fad929533f0261834b81122b1a54b468057befa7 --- /dev/null +++ b/mlp_out_all/layer_19_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_19_width_16k_l0_small/config.json b/mlp_out_all/layer_19_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8c470c902fb40949949c2ac0215c4f411eb3ad5c --- /dev/null +++ b/mlp_out_all/layer_19_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_19_width_262k_l0_big/config.json b/mlp_out_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bc8e3980518d7d7f31846496524d6b4cf6610524 --- /dev/null +++ b/mlp_out_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_19_width_262k_l0_small/config.json b/mlp_out_all/layer_19_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5234856dfea05d74c1a639c20bfd0ca9404f6e95 --- /dev/null +++ b/mlp_out_all/layer_19_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_1_width_16k_l0_big/config.json b/mlp_out_all/layer_1_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7c57efb0043c26e8278c742c622099a8b5cd3c21 --- /dev/null +++ b/mlp_out_all/layer_1_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_1_width_16k_l0_small/config.json b/mlp_out_all/layer_1_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..08dd194382fdfc214efb7767e3afec4aa5ac017d --- /dev/null +++ b/mlp_out_all/layer_1_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_1_width_262k_l0_big/config.json b/mlp_out_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..646f0643ea8f7ac6257387f23372541a3a67540d --- /dev/null +++ b/mlp_out_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_1_width_262k_l0_small/config.json b/mlp_out_all/layer_1_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..97c1d370cf20f0f617574b8af4255eb0ef494ed2 --- /dev/null +++ b/mlp_out_all/layer_1_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_20_width_16k_l0_big/config.json b/mlp_out_all/layer_20_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9efbe37636bf976856ce94660b133bcde0d2f15c --- /dev/null +++ b/mlp_out_all/layer_20_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_20_width_16k_l0_small/config.json b/mlp_out_all/layer_20_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..79a1d5d5c1bef52295db379d05decccd569b17c5 --- /dev/null +++ b/mlp_out_all/layer_20_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_20_width_262k_l0_big/config.json b/mlp_out_all/layer_20_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9b47d5fa36f8a5661baf47ef7d66598effa50848 --- /dev/null +++ b/mlp_out_all/layer_20_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_20_width_262k_l0_small/config.json b/mlp_out_all/layer_20_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8159aa685d86ba928de952f9f776ff5607737e06 --- /dev/null +++ b/mlp_out_all/layer_20_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_21_width_16k_l0_big/config.json b/mlp_out_all/layer_21_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9167a300e6ddf0c54c2abd3214110793350ec645 --- /dev/null +++ b/mlp_out_all/layer_21_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_21_width_16k_l0_small/config.json b/mlp_out_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a969c0aa15e971f9bcea5b9b29ff1667148ab907 --- /dev/null +++ b/mlp_out_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_21_width_262k_l0_big/config.json b/mlp_out_all/layer_21_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f80bde3fab7bbf50aa236db2cc9d934427b3db89 --- /dev/null +++ b/mlp_out_all/layer_21_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_21_width_262k_l0_small/config.json b/mlp_out_all/layer_21_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..198f52d16cbec28fac590fe9dbc4be4201fd4580 --- /dev/null +++ b/mlp_out_all/layer_21_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_16k_l0_big/config.json b/mlp_out_all/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f01f4cdbedf9bb2a19dc9f34e83faaf3a31081b8 --- /dev/null +++ b/mlp_out_all/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_16k_l0_small/config.json b/mlp_out_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3af3f550dc704bec0a27d83c0c79856e1cb58e39 --- /dev/null +++ b/mlp_out_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_262k_l0_big/config.json b/mlp_out_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b0ba0bdf8e6a7fb960abf1cd2b5a31da85069977 --- /dev/null +++ b/mlp_out_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_262k_l0_small/config.json b/mlp_out_all/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5dbafe6796045f4e47f31a9048267109e52b89f0 --- /dev/null +++ b/mlp_out_all/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_16k_l0_big/config.json b/mlp_out_all/layer_23_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..69a73f862456d07ffced136b9e13005711716d10 --- /dev/null +++ b/mlp_out_all/layer_23_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_16k_l0_small/config.json b/mlp_out_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bca757a261e48efde11834de0603f86cf2fe7966 --- /dev/null +++ b/mlp_out_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_262k_l0_big/config.json b/mlp_out_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c74b7f22800b6864246d66a9af56b3d24de159f4 --- /dev/null +++ b/mlp_out_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_262k_l0_small/config.json b/mlp_out_all/layer_23_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7e3b3f2d25d247eab3b2968b75b2cce90c601704 --- /dev/null +++ b/mlp_out_all/layer_23_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_24_width_16k_l0_big/config.json b/mlp_out_all/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7e66cc74e12ffe3b5733d9829c5d33cabe40dccb --- /dev/null +++ b/mlp_out_all/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_24_width_16k_l0_small/config.json b/mlp_out_all/layer_24_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cef1538ef3c6c3f9efb34ca66f7281552c997bbf --- /dev/null +++ b/mlp_out_all/layer_24_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_24_width_262k_l0_big/config.json b/mlp_out_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6c8eaec9857bacd0cec1f07c7ee36fbe693c4648 --- /dev/null +++ b/mlp_out_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_24_width_262k_l0_small/config.json b/mlp_out_all/layer_24_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..db52e2e1c19b4bd56cbcaff02bc7523a41f062aa --- /dev/null +++ b/mlp_out_all/layer_24_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_16k_l0_big/config.json b/mlp_out_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..23933222b4709ca7e66fe512a05b25f5eb36fd1a --- /dev/null +++ b/mlp_out_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_16k_l0_small/config.json b/mlp_out_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e3e09598c4f6b4203e3e1d7e3672ec6b5cb12028 --- /dev/null +++ b/mlp_out_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_262k_l0_big/config.json b/mlp_out_all/layer_25_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..510c653214f91a16f3aec5bec00570b3cb68c1a8 --- /dev/null +++ b/mlp_out_all/layer_25_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_262k_l0_small/config.json b/mlp_out_all/layer_25_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b3b90fc23fca3d09298dd196aed4792199bdd949 --- /dev/null +++ b/mlp_out_all/layer_25_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_16k_l0_big/config.json b/mlp_out_all/layer_2_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0621ee004e9417dc3383317d2fc461c15e03d2b2 --- /dev/null +++ b/mlp_out_all/layer_2_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_16k_l0_small/config.json b/mlp_out_all/layer_2_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a79f0fb4a866651840c420e0ddfa461e909be6c --- /dev/null +++ b/mlp_out_all/layer_2_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_262k_l0_big/config.json b/mlp_out_all/layer_2_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..65ab25721924d2929ed4069485190854f66ee01c --- /dev/null +++ b/mlp_out_all/layer_2_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_262k_l0_small/config.json b/mlp_out_all/layer_2_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..05b1e91ff41c3c06935fdb3b961146f4f7b3dc0d --- /dev/null +++ b/mlp_out_all/layer_2_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_16k_l0_big/config.json b/mlp_out_all/layer_3_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a45c3728c57e44ceaba9fd5214482ada124da9a4 --- /dev/null +++ b/mlp_out_all/layer_3_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_16k_l0_small/config.json b/mlp_out_all/layer_3_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..653cdede2b0cf58c0382bc41106f423a92a9d137 --- /dev/null +++ b/mlp_out_all/layer_3_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_262k_l0_big/config.json b/mlp_out_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..833768931feead0667805e0812d907dd55f4d4d8 --- /dev/null +++ b/mlp_out_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_262k_l0_small/config.json b/mlp_out_all/layer_3_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2f3fa9dc048fb5fa4db6f29ce59f4e59fffc8085 --- /dev/null +++ b/mlp_out_all/layer_3_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_16k_l0_big/config.json b/mlp_out_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2d1089372e1e84ee76a6133644b1138d6da8dca1 --- /dev/null +++ b/mlp_out_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_16k_l0_small/config.json b/mlp_out_all/layer_4_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c765a0e610c0294c1953138167def2f4310cd955 --- /dev/null +++ b/mlp_out_all/layer_4_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_262k_l0_big/config.json b/mlp_out_all/layer_4_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2b0dc91898d675529ea5fd6fbecaab62eac58557 --- /dev/null +++ b/mlp_out_all/layer_4_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_262k_l0_small/config.json b/mlp_out_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..26ffeeab4a1e47b1de3da4d35758ba11fab51cb9 --- /dev/null +++ b/mlp_out_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_16k_l0_big/config.json b/mlp_out_all/layer_5_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9ed68688533f6c6ae4f86dd7dba2bc25e4d65cce --- /dev/null +++ b/mlp_out_all/layer_5_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_16k_l0_small/config.json b/mlp_out_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..90df762b4b8865fa3c85a777aa9c15dfa991e724 --- /dev/null +++ b/mlp_out_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_262k_l0_big/config.json b/mlp_out_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f103ebffc11c36e49cf39a5786b4f042945e9fd9 --- /dev/null +++ b/mlp_out_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_262k_l0_small/config.json b/mlp_out_all/layer_5_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..719bf340903d805139c243428a45101690166038 --- /dev/null +++ b/mlp_out_all/layer_5_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_16k_l0_big/config.json b/mlp_out_all/layer_6_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e953a1c50f34afe44b5976e689a7a8cde9335aa6 --- /dev/null +++ b/mlp_out_all/layer_6_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_16k_l0_small/config.json b/mlp_out_all/layer_6_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aca23868eb62a3d1e8ef7da4e7b4f5ce6fefe0e0 --- /dev/null +++ b/mlp_out_all/layer_6_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_262k_l0_big/config.json b/mlp_out_all/layer_6_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4eda547babe958ec96ce31c8e00d0719e43b4ffa --- /dev/null +++ b/mlp_out_all/layer_6_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_262k_l0_small/config.json b/mlp_out_all/layer_6_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1695a531f93aaffda6c3284d0eead997e19ccebb --- /dev/null +++ b/mlp_out_all/layer_6_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_big/config.json b/mlp_out_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1a864574d25e86be1172a2c27cb04f11ccc8c9a5 --- /dev/null +++ b/mlp_out_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_small/config.json b/mlp_out_all/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2f9959e039d841a84029869d51ed12003e527307 --- /dev/null +++ b/mlp_out_all/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_262k_l0_big/config.json b/mlp_out_all/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..98537569fdf64e4173831db6afc42522e7530282 --- /dev/null +++ b/mlp_out_all/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_262k_l0_small/config.json b/mlp_out_all/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fed01af8747d2606e52c10ed0df3aa4e2414edff --- /dev/null +++ b/mlp_out_all/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_16k_l0_big/config.json b/mlp_out_all/layer_8_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c7421b851aa103ae0b43cab38836f53e6c85b078 --- /dev/null +++ b/mlp_out_all/layer_8_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_16k_l0_small/config.json b/mlp_out_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..56da40f751671d7a4801f7a52182e920d58e72e5 --- /dev/null +++ b/mlp_out_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_262k_l0_big/config.json b/mlp_out_all/layer_8_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cb37507986db31c78563db514f81bb371f792f80 --- /dev/null +++ b/mlp_out_all/layer_8_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_262k_l0_small/config.json b/mlp_out_all/layer_8_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..484babb1bba8b7de7368e4e55c264c5ca47f1497 --- /dev/null +++ b/mlp_out_all/layer_8_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_16k_l0_big/config.json b/mlp_out_all/layer_9_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0812b6271962faa772b047a6b9f078c12de846f8 --- /dev/null +++ b/mlp_out_all/layer_9_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_16k_l0_small/config.json b/mlp_out_all/layer_9_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cd49423024426a796e4643a7bac57520525d5d32 --- /dev/null +++ b/mlp_out_all/layer_9_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_262k_l0_big/config.json b/mlp_out_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bfddf20b10041f27dbef7f5ba07452357d463425 --- /dev/null +++ b/mlp_out_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_262k_l0_small/config.json b/mlp_out_all/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..46e0ff3b4f5c6b698dbdf8f3d0b4d41a29c436d3 --- /dev/null +++ b/mlp_out_all/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_16k_l0_big/config.json b/resid_post/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f65125439151d45c4e72a798354654bdf638a25a --- /dev/null +++ b/resid_post/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_16k_l0_medium/config.json b/resid_post/layer_13_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b25dd9422862ba9fc54e6ba7b067b56476e30cb7 --- /dev/null +++ b/resid_post/layer_13_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_16k_l0_small/config.json b/resid_post/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3500422c93fab42e71b148374c8aaa3d3e0aa9bb --- /dev/null +++ b/resid_post/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_1m_l0_big/config.json b/resid_post/layer_13_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5a913d76c4434ae39ecdbec0b4b0b7fcfb85b745 --- /dev/null +++ b/resid_post/layer_13_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_1m_l0_medium/config.json b/resid_post/layer_13_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d271c64513933748cf6ff3f5a135977f1d7ac6fc --- /dev/null +++ b/resid_post/layer_13_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_1m_l0_small/config.json b/resid_post/layer_13_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..89861502655b0751ad0b0102e8ecc34c0cc008c0 --- /dev/null +++ b/resid_post/layer_13_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_262k_l0_big/config.json b/resid_post/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..26af8d6e83e93abfb44bd237c4da592147b59576 --- /dev/null +++ b/resid_post/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_262k_l0_medium/config.json b/resid_post/layer_13_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6f98d160cd0d682996b5cd112324d6d08c82570e --- /dev/null +++ b/resid_post/layer_13_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_13_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6f98d160cd0d682996b5cd112324d6d08c82570e --- /dev/null +++ b/resid_post/layer_13_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_262k_l0_small/config.json b/resid_post/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc9dd4c6e4c1e41383cae57e478ad3a4d1e9750 --- /dev/null +++ b/resid_post/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_65k_l0_big/config.json b/resid_post/layer_13_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cdecc34ef6d5f608314454c379608d64ddd362d3 --- /dev/null +++ b/resid_post/layer_13_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_65k_l0_medium/config.json b/resid_post/layer_13_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..369dcf1701fb4c99023468539e3536ac517149d5 --- /dev/null +++ b/resid_post/layer_13_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_13_width_65k_l0_small/config.json b/resid_post/layer_13_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..955e8ae33441f7c8d0c4117a20c99d89a2907731 --- /dev/null +++ b/resid_post/layer_13_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_16k_l0_big/config.json b/resid_post/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fe44ceb08570f81833c42fd810856728cfc81f20 --- /dev/null +++ b/resid_post/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_16k_l0_medium/config.json b/resid_post/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0c7ece12d46f934ac0e35d50b17b8e8b84199d98 --- /dev/null +++ b/resid_post/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_16k_l0_small/config.json b/resid_post/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..64fb256376e32c5d5446b1106311959c222b7936 --- /dev/null +++ b/resid_post/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_1m_l0_big/config.json b/resid_post/layer_17_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fee3271ec5199397031361b8a10f802be9b64b63 --- /dev/null +++ b/resid_post/layer_17_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_1m_l0_medium/config.json b/resid_post/layer_17_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..08758794972c8faaa92da1c4398623d42f01a4be --- /dev/null +++ b/resid_post/layer_17_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_1m_l0_small/config.json b/resid_post/layer_17_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4f0f02c7d62434dc7e21dd223cff37fc4ef0abab --- /dev/null +++ b/resid_post/layer_17_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_big/config.json b/resid_post/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b08fc1ba2d1a2e0ddf38ae5e6a42096b1abb2e06 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_medium/config.json b/resid_post/layer_17_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..485936ffb528f2ae3ebe4e476c1963cbb3785d63 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_17_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..485936ffb528f2ae3ebe4e476c1963cbb3785d63 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_small/config.json b/resid_post/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fa1624d9f36ba191555ac1a17da83f6a033a0478 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_65k_l0_big/config.json b/resid_post/layer_17_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3dde1afdb8848d6693917562b3b5aa36191f9d9d --- /dev/null +++ b/resid_post/layer_17_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_65k_l0_medium/config.json b/resid_post/layer_17_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..72b38eea3de941ff98a385169aca5c140eadedff --- /dev/null +++ b/resid_post/layer_17_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_65k_l0_small/config.json b/resid_post/layer_17_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7acd4f2577b6a376848173e3ea97614d0ca8f4b4 --- /dev/null +++ b/resid_post/layer_17_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_16k_l0_big/config.json b/resid_post/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..16f151b1b84a05d51f3b4c29671ec7482be4b5e9 --- /dev/null +++ b/resid_post/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_16k_l0_medium/config.json b/resid_post/layer_22_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fdf6535ce9dfd668fbf31ae7d9f761683d079fe9 --- /dev/null +++ b/resid_post/layer_22_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_16k_l0_small/config.json b/resid_post/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..54c890ab28a0891c2010361894feb06feb995908 --- /dev/null +++ b/resid_post/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_1m_l0_big/config.json b/resid_post/layer_22_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4073506057752e9b50b737f7f3f00a77b4c045cc --- /dev/null +++ b/resid_post/layer_22_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_1m_l0_medium/config.json b/resid_post/layer_22_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b1c24b5bf9c01f05ab5a331f24748ac52c7a4924 --- /dev/null +++ b/resid_post/layer_22_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_1m_l0_small/config.json b/resid_post/layer_22_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2a94c30b8f452f0f34e032d5c31f1396fd5405bd --- /dev/null +++ b/resid_post/layer_22_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_262k_l0_big/config.json b/resid_post/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..145f6c016521f4957044088c9d0fab1511bc6bb5 --- /dev/null +++ b/resid_post/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_262k_l0_medium/config.json b/resid_post/layer_22_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ba22a6f8dac13e58b48e3da90d77b22b31056980 --- /dev/null +++ b/resid_post/layer_22_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_22_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ba22a6f8dac13e58b48e3da90d77b22b31056980 --- /dev/null +++ b/resid_post/layer_22_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_262k_l0_small/config.json b/resid_post/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2e903498498f9c3fddcc3cf7d7f409a028483968 --- /dev/null +++ b/resid_post/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_65k_l0_big/config.json b/resid_post/layer_22_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d69e7078c1546a8d55341133fd4ea5b5650ba9d6 --- /dev/null +++ b/resid_post/layer_22_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_65k_l0_medium/config.json b/resid_post/layer_22_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..496c1ced1510b2d96c3fad2afaaf0f790ebb09d0 --- /dev/null +++ b/resid_post/layer_22_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_65k_l0_small/config.json b/resid_post/layer_22_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d21c861953a814b1e77d3dbbde446ec385132cb3 --- /dev/null +++ b/resid_post/layer_22_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_16k_l0_big/config.json b/resid_post/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..425843d7bf14574b276eee621f3ed59e243142c6 --- /dev/null +++ b/resid_post/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_16k_l0_medium/config.json b/resid_post/layer_7_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2dbceb31b1e06afce599f65875984c89b5677e43 --- /dev/null +++ b/resid_post/layer_7_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_16k_l0_small/config.json b/resid_post/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dc23fe895649680c9f6ceb9b8db9c3b13e773b85 --- /dev/null +++ b/resid_post/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_1m_l0_big/config.json b/resid_post/layer_7_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..16afa2d98c672207827a4a1eb6e9c373f81984ee --- /dev/null +++ b/resid_post/layer_7_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_1m_l0_medium/config.json b/resid_post/layer_7_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d3633b968a03e581c4e506235faca17252a4a99c --- /dev/null +++ b/resid_post/layer_7_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_1m_l0_small/config.json b/resid_post/layer_7_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9279dd9891bba3f921976b17b4ba7b2f6dca08d2 --- /dev/null +++ b/resid_post/layer_7_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 1048576, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_262k_l0_big/config.json b/resid_post/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c3195038b009d7cb0b9dd746ad80e4c54ce56f6f --- /dev/null +++ b/resid_post/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_262k_l0_medium/config.json b/resid_post/layer_7_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ba9c686054068aa47131fb48fde3dfb037077e5b --- /dev/null +++ b/resid_post/layer_7_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_7_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ba9c686054068aa47131fb48fde3dfb037077e5b --- /dev/null +++ b/resid_post/layer_7_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_262k_l0_small/config.json b/resid_post/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ae4694fdd4170808ed7b8627f0a13c4529e7401 --- /dev/null +++ b/resid_post/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_65k_l0_big/config.json b/resid_post/layer_7_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5096233928ecc8a7f86681358fb612cb879b97e0 --- /dev/null +++ b/resid_post/layer_7_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_65k_l0_medium/config.json b/resid_post/layer_7_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..adc5da5ccdd50d6f2b6b33a4f9b48da74ebb3e6d --- /dev/null +++ b/resid_post/layer_7_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_7_width_65k_l0_small/config.json b/resid_post/layer_7_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a62ac8a412c4ae415937475b2f579722e464bc46 --- /dev/null +++ b/resid_post/layer_7_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_16k_l0_big/config.json b/resid_post_all/layer_0_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c101c318fe6fdefdf585b5861dcc960f247789f1 --- /dev/null +++ b/resid_post_all/layer_0_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_16k_l0_small/config.json b/resid_post_all/layer_0_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8d7d80ab1361e7591e841fa16a24c26fe2fdae0d --- /dev/null +++ b/resid_post_all/layer_0_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_262k_l0_big/config.json b/resid_post_all/layer_0_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..711d0744599836391ccf0c23ef2cb37e74870125 --- /dev/null +++ b/resid_post_all/layer_0_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_262k_l0_small/config.json b/resid_post_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9514cccfbca9355ac126aedef18fe8fb23d7fb3b --- /dev/null +++ b/resid_post_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_16k_l0_big/config.json b/resid_post_all/layer_10_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7085ac4be4f59f90851ec0c2f099b61854f73220 --- /dev/null +++ b/resid_post_all/layer_10_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_16k_l0_small/config.json b/resid_post_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..adcb2026b6ad9ddd32be341e4dff9b386e06753d --- /dev/null +++ b/resid_post_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_262k_l0_big/config.json b/resid_post_all/layer_10_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aad15c4a5b1a477111c55be914e6678476c5dd9b --- /dev/null +++ b/resid_post_all/layer_10_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_262k_l0_small/config.json b/resid_post_all/layer_10_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c505b26d848e7fe56eaae312d9e9db08096970c2 --- /dev/null +++ b/resid_post_all/layer_10_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_16k_l0_big/config.json b/resid_post_all/layer_11_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..978def9f4d9982a5c321b68e0aaf714d7913bb70 --- /dev/null +++ b/resid_post_all/layer_11_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_16k_l0_small/config.json b/resid_post_all/layer_11_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..66015c984114112e2486f2b21c887ee5d5cd9fc6 --- /dev/null +++ b/resid_post_all/layer_11_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_262k_l0_big/config.json b/resid_post_all/layer_11_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3d57e5033ed85ab4b53f7e24d3e61baf5b3488ac --- /dev/null +++ b/resid_post_all/layer_11_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_11_width_262k_l0_small/config.json b/resid_post_all/layer_11_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ea22edbf32cc41d54cb082b4bb725a2f1916d277 --- /dev/null +++ b/resid_post_all/layer_11_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.output", + "hf_hook_point_out": "model.layers.11.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_16k_l0_big/config.json b/resid_post_all/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..71588751094e652dc5b5fbdfa212db780bb427b9 --- /dev/null +++ b/resid_post_all/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_16k_l0_small/config.json b/resid_post_all/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..506ae9dd0ab21b98cc27001277325c7cf95e1944 --- /dev/null +++ b/resid_post_all/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_262k_l0_big/config.json b/resid_post_all/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6586ce69ed8b8dcd2e9cda4a4dfaf21ac33d5749 --- /dev/null +++ b/resid_post_all/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_262k_l0_small/config.json b/resid_post_all/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aff976b616778db2321dcddfe245cba5c99367bd --- /dev/null +++ b/resid_post_all/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_16k_l0_big/config.json b/resid_post_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b12824b369ba91440976e6ea2b956064f1d644fc --- /dev/null +++ b/resid_post_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_16k_l0_small/config.json b/resid_post_all/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3500422c93fab42e71b148374c8aaa3d3e0aa9bb --- /dev/null +++ b/resid_post_all/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_262k_l0_big/config.json b/resid_post_all/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8abc272723b9bd999b04095497eed91a776772b6 --- /dev/null +++ b/resid_post_all/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_262k_l0_small/config.json b/resid_post_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc9dd4c6e4c1e41383cae57e478ad3a4d1e9750 --- /dev/null +++ b/resid_post_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_16k_l0_big/config.json b/resid_post_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..883969097e7ece68e39b2047940267c99d9444d1 --- /dev/null +++ b/resid_post_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_16k_l0_small/config.json b/resid_post_all/layer_14_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..613108e6acc323ee871276c2d2092df5a753ba01 --- /dev/null +++ b/resid_post_all/layer_14_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_262k_l0_big/config.json b/resid_post_all/layer_14_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..64db65a33e0a821764a7db2878d5f2b9cff96e94 --- /dev/null +++ b/resid_post_all/layer_14_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_262k_l0_small/config.json b/resid_post_all/layer_14_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cb97513c4cc020a570f3e2812910b1d6c4e1c7fc --- /dev/null +++ b/resid_post_all/layer_14_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_16k_l0_big/config.json b/resid_post_all/layer_15_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f843af0e81d3987e126157f70a023efef2c034a3 --- /dev/null +++ b/resid_post_all/layer_15_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_16k_l0_small/config.json b/resid_post_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ca9b52fbc02ac815bbcf1cfb646bbd2cd096dfd --- /dev/null +++ b/resid_post_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_262k_l0_big/config.json b/resid_post_all/layer_15_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..afb36daba9aa7d8a49c0fd5cd1d83dde6b2cae44 --- /dev/null +++ b/resid_post_all/layer_15_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_262k_l0_small/config.json b/resid_post_all/layer_15_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cafc262d7f1081d220f2a401e30d69d716c04d2d --- /dev/null +++ b/resid_post_all/layer_15_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_16k_l0_big/config.json b/resid_post_all/layer_16_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0b22125eccf74e66bf4209189be7fa3092df7d81 --- /dev/null +++ b/resid_post_all/layer_16_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_16k_l0_small/config.json b/resid_post_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..44650f38dfd2e1f86401a6eeb1cdc73dc19e23c0 --- /dev/null +++ b/resid_post_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_262k_l0_big/config.json b/resid_post_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e3fc759d77772e9654c8d918a6d6edd0d40b2936 --- /dev/null +++ b/resid_post_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_262k_l0_small/config.json b/resid_post_all/layer_16_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8570974a54bd7c072812d5da7484c666140eb6d5 --- /dev/null +++ b/resid_post_all/layer_16_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_16k_l0_big/config.json b/resid_post_all/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6591e825f206ab5db7b6e7a8d329ce0c051f819d --- /dev/null +++ b/resid_post_all/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_16k_l0_small/config.json b/resid_post_all/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..64fb256376e32c5d5446b1106311959c222b7936 --- /dev/null +++ b/resid_post_all/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_262k_l0_big/config.json b/resid_post_all/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ccf6283ba2c862396bc7c1320008946652588b6f --- /dev/null +++ b/resid_post_all/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_262k_l0_small/config.json b/resid_post_all/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fa1624d9f36ba191555ac1a17da83f6a033a0478 --- /dev/null +++ b/resid_post_all/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_16k_l0_big/config.json b/resid_post_all/layer_18_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..10994fbd8dc178a7ea13a4e2ebd14f172ff794d4 --- /dev/null +++ b/resid_post_all/layer_18_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_16k_l0_small/config.json b/resid_post_all/layer_18_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8a5caa099f753df21139b4f90e33d004c75eea96 --- /dev/null +++ b/resid_post_all/layer_18_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_262k_l0_big/config.json b/resid_post_all/layer_18_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aca962bf694835e0beb2e6567d938b090a30c9ba --- /dev/null +++ b/resid_post_all/layer_18_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_262k_l0_small/config.json b/resid_post_all/layer_18_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c0a93a9f8a41f9eda89efc8d6c017ee47c3a976e --- /dev/null +++ b/resid_post_all/layer_18_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_16k_l0_big/config.json b/resid_post_all/layer_19_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c9f9413549debb6922284af1d52a5f337de77db1 --- /dev/null +++ b/resid_post_all/layer_19_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_16k_l0_small/config.json b/resid_post_all/layer_19_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d72d5ff7bd1264c79e564682f8dac918c2eeb590 --- /dev/null +++ b/resid_post_all/layer_19_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_262k_l0_big/config.json b/resid_post_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..354676768a9886b616f615028ff860e709223308 --- /dev/null +++ b/resid_post_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_262k_l0_small/config.json b/resid_post_all/layer_19_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e53f1325f41d544b2350a588c8c57369d99cb615 --- /dev/null +++ b/resid_post_all/layer_19_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_16k_l0_big/config.json b/resid_post_all/layer_1_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..890dfefa52e36889433606be62531d6d887d382a --- /dev/null +++ b/resid_post_all/layer_1_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_16k_l0_small/config.json b/resid_post_all/layer_1_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f9bb81cfe7baf023d7131d36cc0d2f75d0da1fa6 --- /dev/null +++ b/resid_post_all/layer_1_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_262k_l0_big/config.json b/resid_post_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4b3844c7cee165cb71f926851304679d199e482d --- /dev/null +++ b/resid_post_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_262k_l0_small/config.json b/resid_post_all/layer_1_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..11b5e5869285c803d6093bf3f0f2ab55bd53fbe4 --- /dev/null +++ b/resid_post_all/layer_1_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_16k_l0_big/config.json b/resid_post_all/layer_20_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5155910ed3c05a19c75da838a2ce1178edee5d62 --- /dev/null +++ b/resid_post_all/layer_20_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_16k_l0_small/config.json b/resid_post_all/layer_20_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fa2f3fa39e0b185d1a11343b197c238c1308e30e --- /dev/null +++ b/resid_post_all/layer_20_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_262k_l0_big/config.json b/resid_post_all/layer_20_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0add8c93c357c2d501b7b7cdf4475334c780368f --- /dev/null +++ b/resid_post_all/layer_20_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_262k_l0_small/config.json b/resid_post_all/layer_20_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9b2cd54a8d02eda8314b4171442bb92a819924df --- /dev/null +++ b/resid_post_all/layer_20_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_16k_l0_big/config.json b/resid_post_all/layer_21_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df09190e700ebccd54b71f09aefca7d752493072 --- /dev/null +++ b/resid_post_all/layer_21_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_16k_l0_small/config.json b/resid_post_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..206c953bb179fb84ec0c3ab6f15219117a04b2b6 --- /dev/null +++ b/resid_post_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_262k_l0_big/config.json b/resid_post_all/layer_21_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b13ea3abae4db70de220016b6a4eef47bbf6f6f4 --- /dev/null +++ b/resid_post_all/layer_21_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_262k_l0_small/config.json b/resid_post_all/layer_21_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c96cd2195b0580a116064436c7ce512c07e94d05 --- /dev/null +++ b/resid_post_all/layer_21_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_16k_l0_big/config.json b/resid_post_all/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..34616571f2f3bb96a50d140cb4530b2086bef481 --- /dev/null +++ b/resid_post_all/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_16k_l0_small/config.json b/resid_post_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..54c890ab28a0891c2010361894feb06feb995908 --- /dev/null +++ b/resid_post_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_262k_l0_big/config.json b/resid_post_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fd99f53f8317a19a8de95d3ea5588f6452eec7f4 --- /dev/null +++ b/resid_post_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_262k_l0_small/config.json b/resid_post_all/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2e903498498f9c3fddcc3cf7d7f409a028483968 --- /dev/null +++ b/resid_post_all/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_16k_l0_big/config.json b/resid_post_all/layer_23_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..673c9acea809b8a7ebc07929099dcf8c81a53e82 --- /dev/null +++ b/resid_post_all/layer_23_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_16k_l0_small/config.json b/resid_post_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e5914980093956a84aa984d00269335f86086e52 --- /dev/null +++ b/resid_post_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_262k_l0_big/config.json b/resid_post_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1d92415bc0f34907b5890314ca40021ae8388c49 --- /dev/null +++ b/resid_post_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_262k_l0_small/config.json b/resid_post_all/layer_23_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32097a5a22bd9907221e69dd0859dcd6a6b7d580 --- /dev/null +++ b/resid_post_all/layer_23_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_16k_l0_big/config.json b/resid_post_all/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6405f4780eefc99e9bfde078c725b27d68375b43 --- /dev/null +++ b/resid_post_all/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_16k_l0_small/config.json b/resid_post_all/layer_24_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..487de585e28db410f7dbf6be750eacd939803aaa --- /dev/null +++ b/resid_post_all/layer_24_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_262k_l0_big/config.json b/resid_post_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df6c7dd8fb52fa02853ee2946ace660e47cade5b --- /dev/null +++ b/resid_post_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_262k_l0_small/config.json b/resid_post_all/layer_24_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a286bf415a978006d7e51fe9133c7cd5350dbf5 --- /dev/null +++ b/resid_post_all/layer_24_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_16k_l0_big/config.json b/resid_post_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a1b2daf74feb11d5258517a037fae2ab68c0222 --- /dev/null +++ b/resid_post_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_16k_l0_small/config.json b/resid_post_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8014b0de261da97cf706a039e94b07fcae740566 --- /dev/null +++ b/resid_post_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_262k_l0_big/config.json b/resid_post_all/layer_25_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c38d15225fa8e767a10bcab2ab0b3b47ab513b61 --- /dev/null +++ b/resid_post_all/layer_25_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_262k_l0_small/config.json b/resid_post_all/layer_25_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..13dc1ba3a0e284c6f240a0b7bfe65749f9d9e031 --- /dev/null +++ b/resid_post_all/layer_25_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_16k_l0_big/config.json b/resid_post_all/layer_2_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b097834d1323e09c99ab3265cb68944b2ec3f129 --- /dev/null +++ b/resid_post_all/layer_2_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_16k_l0_small/config.json b/resid_post_all/layer_2_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..565c5ee509b59c82b088f8707b6cdef3a95ee2c4 --- /dev/null +++ b/resid_post_all/layer_2_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_262k_l0_big/config.json b/resid_post_all/layer_2_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..addb79fe1bbdab085f21fe4eee67a4f895f63524 --- /dev/null +++ b/resid_post_all/layer_2_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_262k_l0_small/config.json b/resid_post_all/layer_2_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0f2848f30ec7462bf2f7821880cbab2504e51f16 --- /dev/null +++ b/resid_post_all/layer_2_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_16k_l0_big/config.json b/resid_post_all/layer_3_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..92d533382711e2a0f36e6932b5abdd649496ef92 --- /dev/null +++ b/resid_post_all/layer_3_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_16k_l0_small/config.json b/resid_post_all/layer_3_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e5557c04d33e51dabe29ae6e6d5a42ff638471c3 --- /dev/null +++ b/resid_post_all/layer_3_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_262k_l0_big/config.json b/resid_post_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5309e593b5acf459c75c6708790abe0a79f088d --- /dev/null +++ b/resid_post_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_262k_l0_small/config.json b/resid_post_all/layer_3_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f45d6dac8df6e66dd916ecc332128587e095916d --- /dev/null +++ b/resid_post_all/layer_3_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_16k_l0_big/config.json b/resid_post_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f273f65b78dce2e73af123d6e8f6277cb0ac7ce3 --- /dev/null +++ b/resid_post_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_16k_l0_small/config.json b/resid_post_all/layer_4_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5155209dd6fb68fe726cb30304aa0cb20da6133 --- /dev/null +++ b/resid_post_all/layer_4_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_262k_l0_big/config.json b/resid_post_all/layer_4_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..60c52cf3b0a0c0ef2348182dbbe6f26f9f042f70 --- /dev/null +++ b/resid_post_all/layer_4_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_262k_l0_small/config.json b/resid_post_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..976c7953ccd5252271fb6cff9ef4b18a11c14e7a --- /dev/null +++ b/resid_post_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_16k_l0_big/config.json b/resid_post_all/layer_5_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..80a9bbdc048259a812c34aff8322aa679e60ba26 --- /dev/null +++ b/resid_post_all/layer_5_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_16k_l0_small/config.json b/resid_post_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ab6e14676eb199af1a62accecca95b68fcc2072e --- /dev/null +++ b/resid_post_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_262k_l0_big/config.json b/resid_post_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..68a6aa2d01f67f018fc0d0d6f1549d4b3331cd56 --- /dev/null +++ b/resid_post_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_262k_l0_small/config.json b/resid_post_all/layer_5_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4b4266a29d06859b3a7ad5afb81e216f25f26b66 --- /dev/null +++ b/resid_post_all/layer_5_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_16k_l0_big/config.json b/resid_post_all/layer_6_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..45496bb476893b3cd0098f65d231d07d20ef9e84 --- /dev/null +++ b/resid_post_all/layer_6_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_16k_l0_small/config.json b/resid_post_all/layer_6_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5448503eb50f0e6d1fe85a8fc123b82a5cd0a370 --- /dev/null +++ b/resid_post_all/layer_6_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_262k_l0_big/config.json b/resid_post_all/layer_6_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1931b0ed3d13ea15f3906625f78a192bcc07134e --- /dev/null +++ b/resid_post_all/layer_6_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_262k_l0_small/config.json b/resid_post_all/layer_6_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f5d76b00041c038100dae63f37ba8a2dbf3750fd --- /dev/null +++ b/resid_post_all/layer_6_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_16k_l0_big/config.json b/resid_post_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e562844db149acf4f9d67b3100638438426b41fa --- /dev/null +++ b/resid_post_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_16k_l0_small/config.json b/resid_post_all/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dc23fe895649680c9f6ceb9b8db9c3b13e773b85 --- /dev/null +++ b/resid_post_all/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_262k_l0_big/config.json b/resid_post_all/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e4f325b811edce089e69eafcb936efaa55255b36 --- /dev/null +++ b/resid_post_all/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_262k_l0_small/config.json b/resid_post_all/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ae4694fdd4170808ed7b8627f0a13c4529e7401 --- /dev/null +++ b/resid_post_all/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_16k_l0_big/config.json b/resid_post_all/layer_8_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..79697bdf859f8aeee2867bd8c59c1e29a4f847cf --- /dev/null +++ b/resid_post_all/layer_8_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_16k_l0_small/config.json b/resid_post_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d19ece358d0c12e0e5ca4c0066065cd5cf098a7a --- /dev/null +++ b/resid_post_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_262k_l0_big/config.json b/resid_post_all/layer_8_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b11f81679144f54ae89356f92dc8ba510bf729f4 --- /dev/null +++ b/resid_post_all/layer_8_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_262k_l0_small/config.json b/resid_post_all/layer_8_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..50f977002577160a3da2c3cba9f8426d3ed71318 --- /dev/null +++ b/resid_post_all/layer_8_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_16k_l0_big/config.json b/resid_post_all/layer_9_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a8024ee7c13460eaa9e61cc9fdc9f143cbf7133d --- /dev/null +++ b/resid_post_all/layer_9_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_16k_l0_small/config.json b/resid_post_all/layer_9_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5ea73a96637b63bc7156a4e5a5cdfd392603da08 --- /dev/null +++ b/resid_post_all/layer_9_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_262k_l0_big/config.json b/resid_post_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..51be68fa2c3a1513d0db7d079a97a956219ab298 --- /dev/null +++ b/resid_post_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_262k_l0_small/config.json b/resid_post_all/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eace80ccdcde344e5b375ede645057bf39e71bd3 --- /dev/null +++ b/resid_post_all/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_big/config.json b/transcoder/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d1118825ea05410e653547c8d2030575cc3035e9 --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_big_affine/config.json b/transcoder/layer_13_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0144bb8b62d37ca26ecf4b6c0420832833c3e55e --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_medium/config.json b/transcoder/layer_13_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..afb38494ac107aa824f0d5d96e3b1e5bd374db0a --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_medium_affine/config.json b/transcoder/layer_13_width_16k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4bfababcb7fa6b6b86245b3a9820582b825e4ac5 --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_small/config.json b/transcoder/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cb222f7865d72f49c1f1217ca83b68431074153b --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_16k_l0_small_affine/config.json b/transcoder/layer_13_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..750ea79d4136dbad53e761b07c0b8e43a8801afe --- /dev/null +++ b/transcoder/layer_13_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_262k_l0_big/config.json b/transcoder/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7b5637ae5a90e5171335d4724909784daa77d75a --- /dev/null +++ b/transcoder/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_262k_l0_big_affine/config.json b/transcoder/layer_13_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0fce2b0256240b61c5c26e34009cd788f7c58756 --- /dev/null +++ b/transcoder/layer_13_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_262k_l0_medium/config.json b/transcoder/layer_13_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..719ce89d052bad8dfab0022b3f5ebe8b51633eaa --- /dev/null +++ b/transcoder/layer_13_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_262k_l0_medium_affine/config.json b/transcoder/layer_13_width_262k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..93461c0e7024e6f98b4aba54d8b42c0db724127e --- /dev/null +++ b/transcoder/layer_13_width_262k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_262k_l0_small/config.json b/transcoder/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7d685a78e48d198acc0779f9c2207589c37254a9 --- /dev/null +++ b/transcoder/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_262k_l0_small_affine/config.json b/transcoder/layer_13_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8f6ca1178faa13b843e2ac0b638946e0fd8333f3 --- /dev/null +++ b/transcoder/layer_13_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_big/config.json b/transcoder/layer_13_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f869c350730180ee0b35b05f98fbb767cca2a7e5 --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_big_affine/config.json b/transcoder/layer_13_width_65k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e1e4d258ce737aba8e0746f79bf8b665e1313e28 --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_medium/config.json b/transcoder/layer_13_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f0a911438133d14877cfad652f532324846f6235 --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_medium_affine/config.json b/transcoder/layer_13_width_65k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f3004b7481baee148476da62600cbdbf83f7eada --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_small/config.json b/transcoder/layer_13_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..403497b76cc502b942f6d796419dadda8ab8a11d --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_13_width_65k_l0_small_affine/config.json b/transcoder/layer_13_width_65k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..580bd5dd37f0b381e526e326e8e353b275f20c6d --- /dev/null +++ b/transcoder/layer_13_width_65k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_big/config.json b/transcoder/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..01fc3c805536934f8d033e5b05f6392cc257c9ff --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_big_affine/config.json b/transcoder/layer_17_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec78bd61c675048012d200ee0635bb4ae49b436f --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_medium/config.json b/transcoder/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7ca0f741fe3e7362f6b7a600b46dfd9c914bb349 --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_medium_affine/config.json b/transcoder/layer_17_width_16k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba39db062ea9b1334c9cb3d6e984b97d5fd3c91 --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_small/config.json b/transcoder/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1d8bd3d7e8b9b375afad41321e955cfd57329445 --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_16k_l0_small_affine/config.json b/transcoder/layer_17_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ddab2869cfa109d43189ac7afbefc9a8e7d338 --- /dev/null +++ b/transcoder/layer_17_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_big/config.json b/transcoder/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..93e87589931b759c9140b35d0beba11e85b7b98b --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_big_affine/config.json b/transcoder/layer_17_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef02dca3db672e9fd446fc0d614065f41898f44a --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_medium/config.json b/transcoder/layer_17_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..18a1d309e329c1515d53f680b3bad471b1f72183 --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_medium_affine/config.json b/transcoder/layer_17_width_262k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1d7fd9d5b45d784a7358ec09ec11a13a865acf76 --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_small/config.json b/transcoder/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c819bc03ba8c94fa5612fd0685f1b6de37cd632b --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_262k_l0_small_affine/config.json b/transcoder/layer_17_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..feb0d0ed6303a5fcd32bf1c580fe727ceb015240 --- /dev/null +++ b/transcoder/layer_17_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_65k_l0_big/config.json b/transcoder/layer_17_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0af82c780ed0d94a574631f4c85e5e84e1a3d337 --- /dev/null +++ b/transcoder/layer_17_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_65k_l0_big_affine/config.json b/transcoder/layer_17_width_65k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7e57e8207f0103322e29c570a4dfa00c15f2f635 --- /dev/null +++ b/transcoder/layer_17_width_65k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_65k_l0_medium/config.json b/transcoder/layer_17_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a7ad7934fe7c18077a9deec8d62b2eff121183a --- /dev/null +++ b/transcoder/layer_17_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_65k_l0_medium_affine/config.json b/transcoder/layer_17_width_65k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a9b67c9ca27b7ba83a1595c00a35f60633be1d9e --- /dev/null +++ b/transcoder/layer_17_width_65k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_65k_l0_small/config.json b/transcoder/layer_17_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2e07f60a66c39c11be4c3141d583d472e85b42b0 --- /dev/null +++ b/transcoder/layer_17_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_17_width_65k_l0_small_affine/config.json b/transcoder/layer_17_width_65k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f088348426152b93318f369f8be3ed2c5ad683b6 --- /dev/null +++ b/transcoder/layer_17_width_65k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_big/config.json b/transcoder/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2b03f352bbc2c5493942915984b4a2601880abea --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_big_affine/config.json b/transcoder/layer_22_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d1bb7df7e3edd722b46ec8e35a97660e876b7e3 --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_medium/config.json b/transcoder/layer_22_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b8b1a1e3670d6026fb4b5d8fc2b5a6e1dcbc5d71 --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_medium_affine/config.json b/transcoder/layer_22_width_16k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d2812d0848014d26db2bbf22045cdba3f759d5e --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_small/config.json b/transcoder/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf58ed6ef7b5a61942598c50936d3a337b2a19c --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_16k_l0_small_affine/config.json b/transcoder/layer_22_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e95c55cd5219c311bec880db067f9065c9325650 --- /dev/null +++ b/transcoder/layer_22_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_big/config.json b/transcoder/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d28b69f011765934ad863659c28660111ddb31af --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_big_affine/config.json b/transcoder/layer_22_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1fd427f502eb5d92d76ecec73e9b68290e4a1086 --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_medium/config.json b/transcoder/layer_22_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..829a1ce5efc663fcf64e412ba2577f9ec5be0eef --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_medium_affine/config.json b/transcoder/layer_22_width_262k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b83d1094f6c656a3fd2371444072233d021bf6f6 --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_small/config.json b/transcoder/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a46582af764ee273bd59b516fdff562a2263635 --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_262k_l0_small_affine/config.json b/transcoder/layer_22_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..119d8eeb13d84f8e57f4865d387b66fb33a365b2 --- /dev/null +++ b/transcoder/layer_22_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_big/config.json b/transcoder/layer_22_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f308ec21360d3322e712ee7858c034b9cc8ff4 --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_big_affine/config.json b/transcoder/layer_22_width_65k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f8340634af4d363098b7393312a75dece95b1124 --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_medium/config.json b/transcoder/layer_22_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a27e5e9e429f33ef069123f55ebcc8f18a59fa2 --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_medium_affine/config.json b/transcoder/layer_22_width_65k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..461d6923650a12dd706b05b89748e174f24c0b78 --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_small/config.json b/transcoder/layer_22_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..15287bb904cc64314fd9d30dc4952fd88266f7a4 --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_22_width_65k_l0_small_affine/config.json b/transcoder/layer_22_width_65k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5bcc3762200c472b79050d3e36ddee7d9b45ea4 --- /dev/null +++ b/transcoder/layer_22_width_65k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_big/config.json b/transcoder/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7f8a81d570e8649732d3a9508af3b2a0442fba0b --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_big_affine/config.json b/transcoder/layer_7_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b78ee229a4cc952eaef1069efa4e6255420defdb --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_medium/config.json b/transcoder/layer_7_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..38a04b3ce4a1eb35e75ca5a9bb3d0fb851342e6f --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_medium_affine/config.json b/transcoder/layer_7_width_16k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3633dd82209a817e924af91065b714d52224d7d5 --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_small/config.json b/transcoder/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..414b325f42ba82345aaf713058b6b6d453feb7e3 --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_16k_l0_small_affine/config.json b/transcoder/layer_7_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..39164479977cae362718fc07708c4247bc0cd883 --- /dev/null +++ b/transcoder/layer_7_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_big/config.json b/transcoder/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3634931d63bc70b661d1f101388e0faa1d3c7dc8 --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_big_affine/config.json b/transcoder/layer_7_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c8e55024be0effaae78513a0c36fc48ad9646219 --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_medium/config.json b/transcoder/layer_7_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7ccbe8b63ce4e4aea95b9f12e68331aa8ed0d6 --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_medium_affine/config.json b/transcoder/layer_7_width_262k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b007e16b2d0e69b52eea035b420673306625ef51 --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_small/config.json b/transcoder/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b72fe63e54aa8fed639ef832e9fe4b919f1978be --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_262k_l0_small_affine/config.json b/transcoder/layer_7_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c447ce084f724a4dcfb7e1f897335733c7b61a41 --- /dev/null +++ b/transcoder/layer_7_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_big/config.json b/transcoder/layer_7_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2803562db1b36c7372847453744cf776a489b9b9 --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_big_affine/config.json b/transcoder/layer_7_width_65k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..868dafefd1b97a7bb1992c4cfa749d4dd917dd2f --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 132, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_medium/config.json b/transcoder/layer_7_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1fd58959920f471b518aebef08de42fc2f1fb289 --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_medium_affine/config.json b/transcoder/layer_7_width_65k_l0_medium_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..99cf932224e04ef7bc8bcab5085dad463338ad80 --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_medium_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 54, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_small/config.json b/transcoder/layer_7_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7d30ea937b3a27701741282057a39ca0922f09e7 --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder/layer_7_width_65k_l0_small_affine/config.json b/transcoder/layer_7_width_65k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f9c0ad06ac8ea5c3bddc14eeb073d030039bbd00 --- /dev/null +++ b/transcoder/layer_7_width_65k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_16k_l0_big/config.json b/transcoder_all/layer_0_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ddcf0ebf2ef94e879889a35de8739619f51a0190 --- /dev/null +++ b/transcoder_all/layer_0_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_16k_l0_big_affine/config.json b/transcoder_all/layer_0_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..be531084c2cb4a64aa06392e6f3ef0fdb7a3f953 --- /dev/null +++ b/transcoder_all/layer_0_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_16k_l0_small/config.json b/transcoder_all/layer_0_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dd9ff2f75fd0b43cfba0046c5614df5e34adb51d --- /dev/null +++ b/transcoder_all/layer_0_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_16k_l0_small_affine/config.json b/transcoder_all/layer_0_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..adeec1aef33549cdcd14a2115d9c17a032b83da2 --- /dev/null +++ b/transcoder_all/layer_0_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_big/config.json b/transcoder_all/layer_0_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..48e58c7fc298792eac7a1495c11debb0c4b110db --- /dev/null +++ b/transcoder_all/layer_0_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_big_affine/config.json b/transcoder_all/layer_0_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..080620a93a9bb7c10f485485249ae0449fc27533 --- /dev/null +++ b/transcoder_all/layer_0_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_small/config.json b/transcoder_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1c751ed0671fac8e3cdca77e9d9663c699286078 --- /dev/null +++ b/transcoder_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_small_affine/config.json b/transcoder_all/layer_0_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..19491ac19842b31ec956766c86e0e333a5ab743c --- /dev/null +++ b/transcoder_all/layer_0_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_big/config.json b/transcoder_all/layer_10_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3c3eeafd58e1caeb07464362130d25fc649204b3 --- /dev/null +++ b/transcoder_all/layer_10_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_big_affine/config.json b/transcoder_all/layer_10_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0e981b13eb0f1cfb980cf21e5054946ea397c285 --- /dev/null +++ b/transcoder_all/layer_10_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_small/config.json b/transcoder_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..73d0651200dcda530c2e9dce2a3905ef3e46bba9 --- /dev/null +++ b/transcoder_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_small_affine/config.json b/transcoder_all/layer_10_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e3127e2e0c7cbe67fce7c6f4ec3bb394709e85db --- /dev/null +++ b/transcoder_all/layer_10_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_big/config.json b/transcoder_all/layer_10_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ea29a19d0eeba34be6c33536f3185552a0534b24 --- /dev/null +++ b/transcoder_all/layer_10_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_big_affine/config.json b/transcoder_all/layer_10_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5e724882376efb2fa6babe2eb34b1b8a3d968e4d --- /dev/null +++ b/transcoder_all/layer_10_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_small/config.json b/transcoder_all/layer_10_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2515fef7b309ff63e29e587fa02cc13005c4884a --- /dev/null +++ b/transcoder_all/layer_10_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_small_affine/config.json b/transcoder_all/layer_10_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..95e430b63bb05ef7c1c311a6f730ac391142bf9e --- /dev/null +++ b/transcoder_all/layer_10_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_big/config.json b/transcoder_all/layer_11_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..99cf887558a57af35f5140d3e6825f2a98022b16 --- /dev/null +++ b/transcoder_all/layer_11_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_big_affine/config.json b/transcoder_all/layer_11_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ae237a964db09b5f2c7010728f34abfbd653a95d --- /dev/null +++ b/transcoder_all/layer_11_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_small/config.json b/transcoder_all/layer_11_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..206efd561acb09179912c1083a1124dff564d941 --- /dev/null +++ b/transcoder_all/layer_11_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_small_affine/config.json b/transcoder_all/layer_11_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0fbc9156dc91c8816c9a6e94a3ddc41a3f358f6 --- /dev/null +++ b/transcoder_all/layer_11_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_big/config.json b/transcoder_all/layer_11_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..76dbb496c221e2ab48703a9aab59a60cde8cf91d --- /dev/null +++ b/transcoder_all/layer_11_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_big_affine/config.json b/transcoder_all/layer_11_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2cebf0b5461a4f31638b286e6f5e13488aae491 --- /dev/null +++ b/transcoder_all/layer_11_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_small/config.json b/transcoder_all/layer_11_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ed9def67a35cdfb9149bbff5ab7986ba6fdd370 --- /dev/null +++ b/transcoder_all/layer_11_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_small_affine/config.json b/transcoder_all/layer_11_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fe46293994fe246a379f44e89824754914bf1e9e --- /dev/null +++ b/transcoder_all/layer_11_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_big/config.json b/transcoder_all/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ff19d66eb7fd317a333a8df184e17225d42f95c1 --- /dev/null +++ b/transcoder_all/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_big_affine/config.json b/transcoder_all/layer_12_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ab22d6fed0a00a14789290cd53d9ca6be418ff8d --- /dev/null +++ b/transcoder_all/layer_12_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_small/config.json b/transcoder_all/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..59fbaedc343d677591e0c55caca5e9243d2ab21b --- /dev/null +++ b/transcoder_all/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_small_affine/config.json b/transcoder_all/layer_12_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8530f4d4ee2c1ddbe625052f07d1fc25334e9ce9 --- /dev/null +++ b/transcoder_all/layer_12_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_big/config.json b/transcoder_all/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..09305b94f4df2fe80383a02c7e834f32c99af072 --- /dev/null +++ b/transcoder_all/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_big_affine/config.json b/transcoder_all/layer_12_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..06c4db63037d94084a87f35bf909ce14eb70db6f --- /dev/null +++ b/transcoder_all/layer_12_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_small/config.json b/transcoder_all/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8a4adab7e32e35412b76ab722d22365d1a5ee24c --- /dev/null +++ b/transcoder_all/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_small_affine/config.json b/transcoder_all/layer_12_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2fc8a9eb1bfcf30c77510e269720435e94a1253e --- /dev/null +++ b/transcoder_all/layer_12_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_big/config.json b/transcoder_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6b5656c667cce11df2bab8fc7548fa153d605846 --- /dev/null +++ b/transcoder_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_big_affine/config.json b/transcoder_all/layer_13_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5ef884f7d0c5e44624708ef343c6af5bb756e2e8 --- /dev/null +++ b/transcoder_all/layer_13_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_small/config.json b/transcoder_all/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cb222f7865d72f49c1f1217ca83b68431074153b --- /dev/null +++ b/transcoder_all/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_small_affine/config.json b/transcoder_all/layer_13_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..750ea79d4136dbad53e761b07c0b8e43a8801afe --- /dev/null +++ b/transcoder_all/layer_13_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_big/config.json b/transcoder_all/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..504a33f426d0bb43cda5163e4364ed02c4416db6 --- /dev/null +++ b/transcoder_all/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_big_affine/config.json b/transcoder_all/layer_13_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..82ca8b28ec3600e21dd9f364d88187f637948076 --- /dev/null +++ b/transcoder_all/layer_13_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_small/config.json b/transcoder_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7d685a78e48d198acc0779f9c2207589c37254a9 --- /dev/null +++ b/transcoder_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_small_affine/config.json b/transcoder_all/layer_13_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8f6ca1178faa13b843e2ac0b638946e0fd8333f3 --- /dev/null +++ b/transcoder_all/layer_13_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_big/config.json b/transcoder_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7b1ad710271ca1f5b9a46557a0631eed3d7073f0 --- /dev/null +++ b/transcoder_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_big_affine/config.json b/transcoder_all/layer_14_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c5f221160859759f5fa754c8d825aee9b21b578 --- /dev/null +++ b/transcoder_all/layer_14_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_small/config.json b/transcoder_all/layer_14_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5d2e808a32d4e4302aa2ec4fe6008b8bd627f5d1 --- /dev/null +++ b/transcoder_all/layer_14_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_small_affine/config.json b/transcoder_all/layer_14_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ac3967b0112e067b885dc048f28b1b1f906d78d6 --- /dev/null +++ b/transcoder_all/layer_14_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_big/config.json b/transcoder_all/layer_14_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4569aa74905459f8855955c7be2d389f3bd5ea0e --- /dev/null +++ b/transcoder_all/layer_14_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_big_affine/config.json b/transcoder_all/layer_14_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0fefb38fe74b6b48d6cbedf548cf7ba7791bcf02 --- /dev/null +++ b/transcoder_all/layer_14_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_small/config.json b/transcoder_all/layer_14_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e261eb7c93e242a0d625e32b45df9f06b303aff3 --- /dev/null +++ b/transcoder_all/layer_14_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_small_affine/config.json b/transcoder_all/layer_14_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a4b905ae2f5a026d40682d00ad5538b1e906f764 --- /dev/null +++ b/transcoder_all/layer_14_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_big/config.json b/transcoder_all/layer_15_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d1ba4936ee2edfaa7c1ad8a82c3376cef1f96ec0 --- /dev/null +++ b/transcoder_all/layer_15_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_big_affine/config.json b/transcoder_all/layer_15_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..36125b604cca194243474e312742e109a203c600 --- /dev/null +++ b/transcoder_all/layer_15_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_small/config.json b/transcoder_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..74717087d9753e1d02bdc29dc41d3598cacfdc23 --- /dev/null +++ b/transcoder_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_small_affine/config.json b/transcoder_all/layer_15_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cff78372a7f195c09b38f8697ba1f3a1e91ad53c --- /dev/null +++ b/transcoder_all/layer_15_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_big/config.json b/transcoder_all/layer_15_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2e184fd84dcc05b27532aa1054129d9b19c2de34 --- /dev/null +++ b/transcoder_all/layer_15_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_big_affine/config.json b/transcoder_all/layer_15_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..01554f6fe18176db37ca839ca41198d997225428 --- /dev/null +++ b/transcoder_all/layer_15_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_small/config.json b/transcoder_all/layer_15_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bfd8e3f3ea505729758560f7bc2c41971f238581 --- /dev/null +++ b/transcoder_all/layer_15_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_small_affine/config.json b/transcoder_all/layer_15_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..95c12d079681b98bd1130788f5511a520ebbe3bc --- /dev/null +++ b/transcoder_all/layer_15_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_big/config.json b/transcoder_all/layer_16_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..10ad7dd857ad0783802af7a62751cd3b88ae58f3 --- /dev/null +++ b/transcoder_all/layer_16_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_big_affine/config.json b/transcoder_all/layer_16_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9c1d515a43dcadf3b529a91a94142651532ae784 --- /dev/null +++ b/transcoder_all/layer_16_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_small/config.json b/transcoder_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..446cf22c726c7fc56b3e02f89db6cd03c3f02df5 --- /dev/null +++ b/transcoder_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_small_affine/config.json b/transcoder_all/layer_16_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..43ff827876ef735789f37b696fe401418d476ccb --- /dev/null +++ b/transcoder_all/layer_16_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_big/config.json b/transcoder_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..63e312fdf31d7ece7d7004bd090f9708f5a46e68 --- /dev/null +++ b/transcoder_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_big_affine/config.json b/transcoder_all/layer_16_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9dea4dadd2b7c071326c0d39780c5bf7b9c4de20 --- /dev/null +++ b/transcoder_all/layer_16_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_small/config.json b/transcoder_all/layer_16_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..23c5219b3d7d2939f2980f6d1c51121bcb956820 --- /dev/null +++ b/transcoder_all/layer_16_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_small_affine/config.json b/transcoder_all/layer_16_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d19a9cba6cefbc3a61821c5f486677a52222024 --- /dev/null +++ b/transcoder_all/layer_16_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_big/config.json b/transcoder_all/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8c1da5f4d6e40a67b2f36a2c11130a16d0e80fd9 --- /dev/null +++ b/transcoder_all/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_big_affine/config.json b/transcoder_all/layer_17_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..334a1be56ffafce50f17c6d0bc2f26507ccfefef --- /dev/null +++ b/transcoder_all/layer_17_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_small/config.json b/transcoder_all/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1d8bd3d7e8b9b375afad41321e955cfd57329445 --- /dev/null +++ b/transcoder_all/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_small_affine/config.json b/transcoder_all/layer_17_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ddab2869cfa109d43189ac7afbefc9a8e7d338 --- /dev/null +++ b/transcoder_all/layer_17_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_big/config.json b/transcoder_all/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..03df0d35cada1027f47669beb53cd1fbc526b9c5 --- /dev/null +++ b/transcoder_all/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_big_affine/config.json b/transcoder_all/layer_17_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a85de9db38adb0a5b3594f8c47ac31c06a38a9e2 --- /dev/null +++ b/transcoder_all/layer_17_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small/config.json b/transcoder_all/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c819bc03ba8c94fa5612fd0685f1b6de37cd632b --- /dev/null +++ b/transcoder_all/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small_affine/config.json b/transcoder_all/layer_17_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..feb0d0ed6303a5fcd32bf1c580fe727ceb015240 --- /dev/null +++ b/transcoder_all/layer_17_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_big/config.json b/transcoder_all/layer_18_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..250a50298923e92a731188c3b3bcf6fe08f778fc --- /dev/null +++ b/transcoder_all/layer_18_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_big_affine/config.json b/transcoder_all/layer_18_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a813a490a00384c1f797ee280a7322ff2a1ee643 --- /dev/null +++ b/transcoder_all/layer_18_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_small/config.json b/transcoder_all/layer_18_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..349628091c8cedda9a17c56213e7933e303ce622 --- /dev/null +++ b/transcoder_all/layer_18_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_small_affine/config.json b/transcoder_all/layer_18_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..00a3a986df9cb378ef8ed65149f5334c1b19bd10 --- /dev/null +++ b/transcoder_all/layer_18_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_big/config.json b/transcoder_all/layer_18_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a48915766fc445f2761fc1d8974e115771d1d750 --- /dev/null +++ b/transcoder_all/layer_18_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_big_affine/config.json b/transcoder_all/layer_18_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5d65a499b143b76f959649c366a42992491927fb --- /dev/null +++ b/transcoder_all/layer_18_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_small/config.json b/transcoder_all/layer_18_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4a2ed01ddad6b6207aee9b5ef0817b667da64d10 --- /dev/null +++ b/transcoder_all/layer_18_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_small_affine/config.json b/transcoder_all/layer_18_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2c860553f4169c75315091b7d35859dd36bdf321 --- /dev/null +++ b/transcoder_all/layer_18_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_big/config.json b/transcoder_all/layer_19_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b28e23ade5c3d62792ab0d1a70b4c4471b4231b1 --- /dev/null +++ b/transcoder_all/layer_19_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_big_affine/config.json b/transcoder_all/layer_19_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7aae80ce8f96e9005ec76a2e56b75ed6dd36368 --- /dev/null +++ b/transcoder_all/layer_19_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_small/config.json b/transcoder_all/layer_19_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f34cdca2cde9a229dc539ec55198622b1acf424b --- /dev/null +++ b/transcoder_all/layer_19_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_small_affine/config.json b/transcoder_all/layer_19_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..205668561c312082701c2e4976f0011562f3729b --- /dev/null +++ b/transcoder_all/layer_19_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_big/config.json b/transcoder_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f8c72624a832377b8b02bfdaecef0f3377b0998c --- /dev/null +++ b/transcoder_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_big_affine/config.json b/transcoder_all/layer_19_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53f2206e9f393464f14a23a0b22675ea72971306 --- /dev/null +++ b/transcoder_all/layer_19_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_small/config.json b/transcoder_all/layer_19_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..31ecf6cf47dd513b67935a6ec30a721c6d95591b --- /dev/null +++ b/transcoder_all/layer_19_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_small_affine/config.json b/transcoder_all/layer_19_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ec421d3955ab11d0de919afcc7135d6c65eb42 --- /dev/null +++ b/transcoder_all/layer_19_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_16k_l0_big/config.json b/transcoder_all/layer_1_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..548d674139831ba3485a4b0817dbceb54949db6e --- /dev/null +++ b/transcoder_all/layer_1_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_16k_l0_big_affine/config.json b/transcoder_all/layer_1_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d367915b5af0fd257d546dfeb4691a17b604c1a5 --- /dev/null +++ b/transcoder_all/layer_1_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_16k_l0_small/config.json b/transcoder_all/layer_1_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ff09b53d8d8ea66e2e61e1d4551671f1dbfda8ac --- /dev/null +++ b/transcoder_all/layer_1_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_16k_l0_small_affine/config.json b/transcoder_all/layer_1_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cf97423eeaaafc6558028940342a9bb0f46d98c8 --- /dev/null +++ b/transcoder_all/layer_1_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_big/config.json b/transcoder_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0c26a64d50ad1ecd4a16ab9c37fb523b96d7acb9 --- /dev/null +++ b/transcoder_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_big_affine/config.json b/transcoder_all/layer_1_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cce9a27602d81ce77c69f33b32e4e8e4b60cbc8a --- /dev/null +++ b/transcoder_all/layer_1_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 66, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_small/config.json b/transcoder_all/layer_1_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8a8edc707eb536e5ae6dab1a71449a0ebe93f19c --- /dev/null +++ b/transcoder_all/layer_1_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_small_affine/config.json b/transcoder_all/layer_1_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..521f6b0975149e83d9a747be89d6cf040cda900e --- /dev/null +++ b/transcoder_all/layer_1_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_big/config.json b/transcoder_all/layer_20_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9397a2d60a938021dc3044934ce1501badf77e34 --- /dev/null +++ b/transcoder_all/layer_20_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_big_affine/config.json b/transcoder_all/layer_20_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8eda85ac9a2739711fd74e4087608594e2bd2118 --- /dev/null +++ b/transcoder_all/layer_20_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_small/config.json b/transcoder_all/layer_20_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ae2c2fde1ea6d14ff672041f8f5302072c7554e4 --- /dev/null +++ b/transcoder_all/layer_20_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_small_affine/config.json b/transcoder_all/layer_20_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5461d310e9f966fe25d0ce93d61c1129747d4d52 --- /dev/null +++ b/transcoder_all/layer_20_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_big/config.json b/transcoder_all/layer_20_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8ee2f179992c4f93fecc9d0e4217cf937dbdda3f --- /dev/null +++ b/transcoder_all/layer_20_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_big_affine/config.json b/transcoder_all/layer_20_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6edb29ba4cbd48aa4f71af70ea2617310adbd584 --- /dev/null +++ b/transcoder_all/layer_20_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_small/config.json b/transcoder_all/layer_20_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..857af33ed3d6778918451cb8eedbc6dffc47ad7e --- /dev/null +++ b/transcoder_all/layer_20_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_small_affine/config.json b/transcoder_all/layer_20_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0debc2adcc064cc95e08941e3f8766baf33f04f8 --- /dev/null +++ b/transcoder_all/layer_20_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_21_width_16k_l0_big/config.json b/transcoder_all/layer_21_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b01498f739ad09c0684cf1396807764d5f65a8a5 --- /dev/null +++ b/transcoder_all/layer_21_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_21_width_16k_l0_big_affine/config.json b/transcoder_all/layer_21_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5a04f6341b87cf7afd19ac8174aa2b7c6edd757f --- /dev/null +++ b/transcoder_all/layer_21_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_21_width_16k_l0_small/config.json b/transcoder_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5460619164e1d3f6a015a044020f37c51012bb10 --- /dev/null +++ b/transcoder_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_21_width_16k_l0_small_affine/config.json b/transcoder_all/layer_21_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..278ed1e2b65d1b67f0fbe778198206859040881a --- /dev/null +++ b/transcoder_all/layer_21_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_21_width_262k_l0_big/config.json b/transcoder_all/layer_21_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1227eb70b88ef0af5f814b6930ea9775cb57cfe2 --- /dev/null +++ b/transcoder_all/layer_21_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_21_width_262k_l0_big_affine/config.json b/transcoder_all/layer_21_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..75018dd6185e1aa00ebd28ad9c5c8751fdaf6484 --- /dev/null +++ b/transcoder_all/layer_21_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_21_width_262k_l0_small/config.json b/transcoder_all/layer_21_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..16de75d38c810652c4a904dd3998bf875cce5479 --- /dev/null +++ b/transcoder_all/layer_21_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_21_width_262k_l0_small_affine/config.json b/transcoder_all/layer_21_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8ace801c963b2a79e5bdf790e21b161feec2ae50 --- /dev/null +++ b/transcoder_all/layer_21_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_16k_l0_big/config.json b/transcoder_all/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..44b07efcd1a6bd17af3e27fe4660423bb368aac7 --- /dev/null +++ b/transcoder_all/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_16k_l0_big_affine/config.json b/transcoder_all/layer_22_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c38462c14b7edd658b204c59a1ee44bd5d3fc53 --- /dev/null +++ b/transcoder_all/layer_22_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_16k_l0_small/config.json b/transcoder_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf58ed6ef7b5a61942598c50936d3a337b2a19c --- /dev/null +++ b/transcoder_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_16k_l0_small_affine/config.json b/transcoder_all/layer_22_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e95c55cd5219c311bec880db067f9065c9325650 --- /dev/null +++ b/transcoder_all/layer_22_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_big/config.json b/transcoder_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d2cbc4afab6e6f55e53992ba17df146ec3ae0631 --- /dev/null +++ b/transcoder_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_big_affine/config.json b/transcoder_all/layer_22_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a04d6850482e1e7a58c0af1405e819a8e1d60e37 --- /dev/null +++ b/transcoder_all/layer_22_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_small/config.json b/transcoder_all/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a46582af764ee273bd59b516fdff562a2263635 --- /dev/null +++ b/transcoder_all/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_small_affine/config.json b/transcoder_all/layer_22_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..119d8eeb13d84f8e57f4865d387b66fb33a365b2 --- /dev/null +++ b/transcoder_all/layer_22_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_big/config.json b/transcoder_all/layer_23_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..efab328a4c608d606bbbd63f027c965b6910cc9e --- /dev/null +++ b/transcoder_all/layer_23_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_big_affine/config.json b/transcoder_all/layer_23_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..089b0c3f67372c470ea17ad021c8aca735933009 --- /dev/null +++ b/transcoder_all/layer_23_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_small/config.json b/transcoder_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..37ec30edf47a74d92f3ea0fd667b343f14567f84 --- /dev/null +++ b/transcoder_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_small_affine/config.json b/transcoder_all/layer_23_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..18dcb9850331f5ee46607f7df6da5e5ac332fd01 --- /dev/null +++ b/transcoder_all/layer_23_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_big/config.json b/transcoder_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ed5cd4ab22da79432789a2be01452e771fccc021 --- /dev/null +++ b/transcoder_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_big_affine/config.json b/transcoder_all/layer_23_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec673a6315d319b5b44788885e5d69363ab86c2c --- /dev/null +++ b/transcoder_all/layer_23_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_small/config.json b/transcoder_all/layer_23_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d25f624e6c01ca69995fb4936352380d09e319a3 --- /dev/null +++ b/transcoder_all/layer_23_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_small_affine/config.json b/transcoder_all/layer_23_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b595718ba2ccd85d95534f006859effc40b9b864 --- /dev/null +++ b/transcoder_all/layer_23_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_big/config.json b/transcoder_all/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..83c74cfc12ab9efb28934ad68f5284423650435f --- /dev/null +++ b/transcoder_all/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_big_affine/config.json b/transcoder_all/layer_24_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..05ec47d54dfe485d281446814c3d91f3aed8c042 --- /dev/null +++ b/transcoder_all/layer_24_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_small/config.json b/transcoder_all/layer_24_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d9299e500b47bb9c02c005435654989ce9fd7eef --- /dev/null +++ b/transcoder_all/layer_24_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_small_affine/config.json b/transcoder_all/layer_24_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2a90232a592da77fd0721fc0ac87a6b5de1bc024 --- /dev/null +++ b/transcoder_all/layer_24_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_big/config.json b/transcoder_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..595d33c1cb077e5e8b0c36dc2b910279b7a5f804 --- /dev/null +++ b/transcoder_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_big_affine/config.json b/transcoder_all/layer_24_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..73304312c238151d74c3f73981eb7735789bbd9e --- /dev/null +++ b/transcoder_all/layer_24_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_small/config.json b/transcoder_all/layer_24_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a103f29b0f16c2aec9c5ebe5ecd254b9c1cb60c2 --- /dev/null +++ b/transcoder_all/layer_24_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_small_affine/config.json b/transcoder_all/layer_24_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1782bfb1ae48a6023cbf16e1e6d0df17ef670729 --- /dev/null +++ b/transcoder_all/layer_24_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_big/config.json b/transcoder_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a014e90ddaaaa81b93fa866b6c120a147cfed4ef --- /dev/null +++ b/transcoder_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_big_affine/config.json b/transcoder_all/layer_25_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9826b5515da482692ad8dfbc1fd43865d82385e9 --- /dev/null +++ b/transcoder_all/layer_25_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_small/config.json b/transcoder_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..06496caef49febe722b951063dd364a2c50ae546 --- /dev/null +++ b/transcoder_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_small_affine/config.json b/transcoder_all/layer_25_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7d9b55ad7d9ad833cb696136ad2705c08eeee32d --- /dev/null +++ b/transcoder_all/layer_25_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_big/config.json b/transcoder_all/layer_25_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..959d208bea9b5509e10fffdc5a01613dee2f561c --- /dev/null +++ b/transcoder_all/layer_25_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_big_affine/config.json b/transcoder_all/layer_25_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e9653f6b933e13a8f54f78a138975682c9d16bcf --- /dev/null +++ b/transcoder_all/layer_25_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_small/config.json b/transcoder_all/layer_25_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1d22f3b3f9ceb5ab62e8b6dc33f4b60af2847259 --- /dev/null +++ b/transcoder_all/layer_25_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_small_affine/config.json b/transcoder_all/layer_25_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef088ea1edc7e7188089ef5e072754de57103b08 --- /dev/null +++ b/transcoder_all/layer_25_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_big/config.json b/transcoder_all/layer_2_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8098d739ed3c6c2680b88a4a17b3816e133eb4af --- /dev/null +++ b/transcoder_all/layer_2_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_big_affine/config.json b/transcoder_all/layer_2_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..94cfa0369f90855fb99dab32f88129662f4692ef --- /dev/null +++ b/transcoder_all/layer_2_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_small/config.json b/transcoder_all/layer_2_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bf627ed8091d58131a0eb44a95c295f640c2006f --- /dev/null +++ b/transcoder_all/layer_2_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_small_affine/config.json b/transcoder_all/layer_2_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5f21214063c6574dde1bd97b180c81c0d80f4df2 --- /dev/null +++ b/transcoder_all/layer_2_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_big/config.json b/transcoder_all/layer_2_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b4f9223dfc5473bcc0aaf8d2329514b11f2ce8ea --- /dev/null +++ b/transcoder_all/layer_2_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_big_affine/config.json b/transcoder_all/layer_2_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7ffe7b2cf50ed7ad77abb4ad27a56cb5b100802c --- /dev/null +++ b/transcoder_all/layer_2_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 73, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_small/config.json b/transcoder_all/layer_2_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a83a9d7c70c8101d7e42566025380004b03df53f --- /dev/null +++ b/transcoder_all/layer_2_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_small_affine/config.json b/transcoder_all/layer_2_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7cc6375e4abf9be1bd5fd1bd7973bab12519094b --- /dev/null +++ b/transcoder_all/layer_2_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_big/config.json b/transcoder_all/layer_3_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4cec6f174333981d1f43ebb96e2c58f1b4b9cd60 --- /dev/null +++ b/transcoder_all/layer_3_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_big_affine/config.json b/transcoder_all/layer_3_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0fa370a65ffc4d9d70bbcdb0916a007c148e0fe0 --- /dev/null +++ b/transcoder_all/layer_3_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_small/config.json b/transcoder_all/layer_3_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9a48f05924d920e6d4bce863de99912c7c5dfab5 --- /dev/null +++ b/transcoder_all/layer_3_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_small_affine/config.json b/transcoder_all/layer_3_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d2f4a12e93bf41cf8847df51c45caac6204ec318 --- /dev/null +++ b/transcoder_all/layer_3_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_big/config.json b/transcoder_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..19c4def52166dddfcea161b7cbc079b3f582f896 --- /dev/null +++ b/transcoder_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_big_affine/config.json b/transcoder_all/layer_3_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8ece9d4f2969ccd8e83e98f7894be31adc60423b --- /dev/null +++ b/transcoder_all/layer_3_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_small/config.json b/transcoder_all/layer_3_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3052777a9c467ed4ce75dc15fa09d29dba32afac --- /dev/null +++ b/transcoder_all/layer_3_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_small_affine/config.json b/transcoder_all/layer_3_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2fe1490ed3bdd07da70c582da6350a053a126ff0 --- /dev/null +++ b/transcoder_all/layer_3_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_big/config.json b/transcoder_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3f65879b93cc4a279f45d28470a6363cb19ebf39 --- /dev/null +++ b/transcoder_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_big_affine/config.json b/transcoder_all/layer_4_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..540bad0ec0b806515e079f9d601c8ab0150d7954 --- /dev/null +++ b/transcoder_all/layer_4_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_small/config.json b/transcoder_all/layer_4_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..51f55a57cf66fbe2214203a4d036fbc25eeeccf3 --- /dev/null +++ b/transcoder_all/layer_4_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_small_affine/config.json b/transcoder_all/layer_4_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ccf460982e736b2744dbe5c4031c1392f932814d --- /dev/null +++ b/transcoder_all/layer_4_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_big/config.json b/transcoder_all/layer_4_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..04b3fbd5812b2e7920388e27ba863ea0ef3f846a --- /dev/null +++ b/transcoder_all/layer_4_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_big_affine/config.json b/transcoder_all/layer_4_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c14966c0b301c952e5af32cf19e8540c9fae3028 --- /dev/null +++ b/transcoder_all/layer_4_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 87, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_small/config.json b/transcoder_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..81ae366933e057dc5961b63a8d092c07e455f14c --- /dev/null +++ b/transcoder_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_small_affine/config.json b/transcoder_all/layer_4_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f8823b2ca13a08f3d76268acc0b7419ac62e7f32 --- /dev/null +++ b/transcoder_all/layer_4_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_big/config.json b/transcoder_all/layer_5_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b59c7d20974ed181e73d80d1db7656d79980c174 --- /dev/null +++ b/transcoder_all/layer_5_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_big_affine/config.json b/transcoder_all/layer_5_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e88cada8fc03d03f60c1c9420dde2441cf4edd91 --- /dev/null +++ b/transcoder_all/layer_5_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_small/config.json b/transcoder_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fdaca305898d673a60f3e4aad86801a7a286d296 --- /dev/null +++ b/transcoder_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_small_affine/config.json b/transcoder_all/layer_5_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9a558543b8e7ce839fe9d9d2fa04caff5559b50a --- /dev/null +++ b/transcoder_all/layer_5_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_big/config.json b/transcoder_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5fc7bde8a457185a47093802c6b61e9758a668a5 --- /dev/null +++ b/transcoder_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_big_affine/config.json b/transcoder_all/layer_5_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..503220c43bc42123d483faf1979a4551a5652b85 --- /dev/null +++ b/transcoder_all/layer_5_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 94, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_small/config.json b/transcoder_all/layer_5_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c029a7545002579e4f4e3956266a58be997c9626 --- /dev/null +++ b/transcoder_all/layer_5_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_small_affine/config.json b/transcoder_all/layer_5_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..747f0afcedaa3e83533e903c77c45a41ba71068e --- /dev/null +++ b/transcoder_all/layer_5_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_big/config.json b/transcoder_all/layer_6_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6c09c698df99e984b78de62c9757f7fbab9acdcd --- /dev/null +++ b/transcoder_all/layer_6_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_big_affine/config.json b/transcoder_all/layer_6_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c3df5a7d671e7a938d14886d7968f049417df3db --- /dev/null +++ b/transcoder_all/layer_6_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_small/config.json b/transcoder_all/layer_6_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..610913b68e19e89dca42ca07cbf55e2825aef644 --- /dev/null +++ b/transcoder_all/layer_6_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_small_affine/config.json b/transcoder_all/layer_6_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..94f9d809feea9ff638c66670f2c07ed6c70f8f0c --- /dev/null +++ b/transcoder_all/layer_6_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_big/config.json b/transcoder_all/layer_6_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6221b8fa7474579b696b7a5a9a03116047abc43d --- /dev/null +++ b/transcoder_all/layer_6_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_big_affine/config.json b/transcoder_all/layer_6_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1b14da011fc07070ea4ed908907e1267add1051c --- /dev/null +++ b/transcoder_all/layer_6_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 101, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_small/config.json b/transcoder_all/layer_6_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..63d17f72b44613c9b4a8943ccabe1b84509a314b --- /dev/null +++ b/transcoder_all/layer_6_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_small_affine/config.json b/transcoder_all/layer_6_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1a10b5e275573e62459d42c9be41cacd6a4b24da --- /dev/null +++ b/transcoder_all/layer_6_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_big/config.json b/transcoder_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eff5d2e79003ab959a4742e052b54c90372ca078 --- /dev/null +++ b/transcoder_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_big_affine/config.json b/transcoder_all/layer_7_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c41e2d661cb673ab87cd713cac00e15b7bf98639 --- /dev/null +++ b/transcoder_all/layer_7_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_small/config.json b/transcoder_all/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..414b325f42ba82345aaf713058b6b6d453feb7e3 --- /dev/null +++ b/transcoder_all/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_small_affine/config.json b/transcoder_all/layer_7_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..39164479977cae362718fc07708c4247bc0cd883 --- /dev/null +++ b/transcoder_all/layer_7_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_big/config.json b/transcoder_all/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..735b6242442734ef6de69c92dcf48ccf4cf218d8 --- /dev/null +++ b/transcoder_all/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_big_affine/config.json b/transcoder_all/layer_7_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..815994c3e52d41f9e9a4d1610872f4ddcd9e6c1d --- /dev/null +++ b/transcoder_all/layer_7_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_small/config.json b/transcoder_all/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b72fe63e54aa8fed639ef832e9fe4b919f1978be --- /dev/null +++ b/transcoder_all/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_small_affine/config.json b/transcoder_all/layer_7_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c447ce084f724a4dcfb7e1f897335733c7b61a41 --- /dev/null +++ b/transcoder_all/layer_7_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_big/config.json b/transcoder_all/layer_8_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..26889a1d662cdfe85aea9d42af55a904c21018de --- /dev/null +++ b/transcoder_all/layer_8_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_big_affine/config.json b/transcoder_all/layer_8_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0bfb0d8021e1f7fe3bba4e497665cdf5901e6e33 --- /dev/null +++ b/transcoder_all/layer_8_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_small/config.json b/transcoder_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..55ed260c0fac40f48d571b95cbf5821c301f87ab --- /dev/null +++ b/transcoder_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_small_affine/config.json b/transcoder_all/layer_8_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b111dad4c53b85b0f200db273ec75347158db816 --- /dev/null +++ b/transcoder_all/layer_8_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_big/config.json b/transcoder_all/layer_8_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5bcecac30789971c3639e7ee39c0e46696bfc1ef --- /dev/null +++ b/transcoder_all/layer_8_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_big_affine/config.json b/transcoder_all/layer_8_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f298cb4c885036278177c468fc9359c159e2fd2c --- /dev/null +++ b/transcoder_all/layer_8_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 115, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_small/config.json b/transcoder_all/layer_8_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b9a4402141e449101f6d55099b65b47ee2a6a967 --- /dev/null +++ b/transcoder_all/layer_8_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_small_affine/config.json b/transcoder_all/layer_8_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..01e416ed60e0806424e6fa773e3d497bf079e48d --- /dev/null +++ b/transcoder_all/layer_8_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_big/config.json b/transcoder_all/layer_9_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2955620f9c742e7c0047264136780aa20c43d81b --- /dev/null +++ b/transcoder_all/layer_9_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_big_affine/config.json b/transcoder_all/layer_9_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fde3b3b9a1fe14b33572cad4f80dad056f2a0b18 --- /dev/null +++ b/transcoder_all/layer_9_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_small/config.json b/transcoder_all/layer_9_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..52d6577965b6814ae078abb188d4c61953a8ef2a --- /dev/null +++ b/transcoder_all/layer_9_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_small_affine/config.json b/transcoder_all/layer_9_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2006006e6a095bc3aacc5166d56706c1b4c2d7a0 --- /dev/null +++ b/transcoder_all/layer_9_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_big/config.json b/transcoder_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ba59733127e294c10fa6b3f840a4f8ba29138927 --- /dev/null +++ b/transcoder_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_big_affine/config.json b/transcoder_all/layer_9_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c70133c69adf29b33ccc32de68df33bc27228066 --- /dev/null +++ b/transcoder_all/layer_9_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_small/config.json b/transcoder_all/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..30d0957fbf8e4eacd8a4c997ea01831f8f29b20f --- /dev/null +++ b/transcoder_all/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_small_affine/config.json b/transcoder_all/layer_9_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..39db0030af17bea048b01cba8a9e3cce5cc2a933 --- /dev/null +++ b/transcoder_all/layer_9_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-1b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file