diff --git a/mlp_out/layer_17_width_16k_l0_big/config.json b/mlp_out/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4cabdd145a9ae46704f94dbe567560bfe6b13968 --- /dev/null +++ b/mlp_out/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_16k_l0_medium/config.json b/mlp_out/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0959c478d44367ee7e59dbd776a6388fbdd5b498 --- /dev/null +++ b/mlp_out/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_16k_l0_small/config.json b/mlp_out/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c8d116f91d6a97091c2e6b1d3a5af28172c67fbf --- /dev/null +++ b/mlp_out/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_big/config.json b/mlp_out/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f4dfd416a5f2c662ea95d7dc039fa933aa02bde8 --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_medium/config.json b/mlp_out/layer_17_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fe5523d295f41d05c6a28b495934a61ae042b289 --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_262k_l0_small/config.json b/mlp_out/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e3a4a6ed3974dbf82c4e702deef2fd3667b0929a --- /dev/null +++ b/mlp_out/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_big/config.json b/mlp_out/layer_17_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..868f0c93243b336f7020efc5071fff7b8b3a638d --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_medium/config.json b/mlp_out/layer_17_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6b6759987e396824950e6cb591035caaedd3b91a --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_17_width_65k_l0_small/config.json b/mlp_out/layer_17_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..26a67a50083cef2e2b77e619fc39cd90ce47fdbb --- /dev/null +++ b/mlp_out/layer_17_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_16k_l0_big/config.json b/mlp_out/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..986a1d98e6511f22493d19f655b1560112e76099 --- /dev/null +++ b/mlp_out/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_16k_l0_medium/config.json b/mlp_out/layer_22_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a3b12a9a3e56f8f197647af0a79b0e28e701cd16 --- /dev/null +++ b/mlp_out/layer_22_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_16k_l0_small/config.json b/mlp_out/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e34c41a9d9647a1801efd58e438e3fab077eceff --- /dev/null +++ b/mlp_out/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_big/config.json b/mlp_out/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8921a3f9d40eb86187fd7957127256f98a45ab2f --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_medium/config.json b/mlp_out/layer_22_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1304a22ff4ac139a2db18b9b475629deaf8b1d5b --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_262k_l0_small/config.json b/mlp_out/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..61505d527dead2d7dbfdeba5ae56907bbd14a51d --- /dev/null +++ b/mlp_out/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_big/config.json b/mlp_out/layer_22_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fab208b7081b85b1a52d6246c2e357bbd1c86a23 --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_medium/config.json b/mlp_out/layer_22_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f02b71ce9b1444a6c47a94d0e6bf99276db8ac2f --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_22_width_65k_l0_small/config.json b/mlp_out/layer_22_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..190dd04fd65dc9cabe6cf992ddf1dd7db889720d --- /dev/null +++ b/mlp_out/layer_22_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_16k_l0_big/config.json b/mlp_out/layer_29_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..39e9b2e8c0ecf9356897514f225f1a7eb4172e86 --- /dev/null +++ b/mlp_out/layer_29_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_16k_l0_medium/config.json b/mlp_out/layer_29_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5ab0aaa04d5e60268391e870ce896c575a29067c --- /dev/null +++ b/mlp_out/layer_29_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_16k_l0_small/config.json b/mlp_out/layer_29_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8498b76402506d94625cf0b0021ec5b11b934698 --- /dev/null +++ b/mlp_out/layer_29_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_262k_l0_big/config.json b/mlp_out/layer_29_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0852eef41cca5b83cbc84d36bc175fa40f3dc838 --- /dev/null +++ b/mlp_out/layer_29_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_262k_l0_medium/config.json b/mlp_out/layer_29_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..85a29d3089838f157b7d2d2fb53cba36016a2b15 --- /dev/null +++ b/mlp_out/layer_29_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_262k_l0_small/config.json b/mlp_out/layer_29_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ff343c66431166b07f7077db01b757af956e88c8 --- /dev/null +++ b/mlp_out/layer_29_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_65k_l0_big/config.json b/mlp_out/layer_29_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..deb6abe08ad8f3fbf70b9ee8fe1fc8ffb853c441 --- /dev/null +++ b/mlp_out/layer_29_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_65k_l0_medium/config.json b/mlp_out/layer_29_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d6d0acbf469ea15b5bda657b98547f02233f250c --- /dev/null +++ b/mlp_out/layer_29_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_29_width_65k_l0_small/config.json b/mlp_out/layer_29_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6c98b3bd4ef6c287b43d64ffd1978fe0b751ea2b --- /dev/null +++ b/mlp_out/layer_29_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_16k_l0_big/config.json b/mlp_out/layer_9_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8f8e23839aa16f319d1fbfff341dbab659625f80 --- /dev/null +++ b/mlp_out/layer_9_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 131, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_16k_l0_medium/config.json b/mlp_out/layer_9_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..44aa77574fde8b77a9336a3a63d65da12400a513 --- /dev/null +++ b/mlp_out/layer_9_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_16k_l0_small/config.json b/mlp_out/layer_9_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..15ea5be9f1b2f9f54d9c0636ddaca652685aade5 --- /dev/null +++ b/mlp_out/layer_9_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_262k_l0_big/config.json b/mlp_out/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b8e34e213e9c7250b7e698e89ca56615392f47e3 --- /dev/null +++ b/mlp_out/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 131, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_262k_l0_medium/config.json b/mlp_out/layer_9_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..11ff751d767af5d812ad6acbdf09cc849ddb13df --- /dev/null +++ b/mlp_out/layer_9_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_262k_l0_small/config.json b/mlp_out/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..194ebd8fd6154fb4429760fe6175da20c8650f0b --- /dev/null +++ b/mlp_out/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_65k_l0_big/config.json b/mlp_out/layer_9_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7138572fabdffbbdc3692a20ce03d929ce621051 --- /dev/null +++ b/mlp_out/layer_9_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 131, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_65k_l0_medium/config.json b/mlp_out/layer_9_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..051683a86653c01f13f14a97c5df182386fa96dd --- /dev/null +++ b/mlp_out/layer_9_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/mlp_out/layer_9_width_65k_l0_small/config.json b/mlp_out/layer_9_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ab9052e1442d723630c7b73309a852e9265edc5 --- /dev/null +++ b/mlp_out/layer_9_width_65k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_16k_l0_big/config.json b/resid_post/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..deac3f3ed72e2d8a96ad477bc52b0454f5517ae6 --- /dev/null +++ b/resid_post/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_16k_l0_medium/config.json b/resid_post/layer_17_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ae4be207792041bad5aabb21420983600fc03b65 --- /dev/null +++ b/resid_post/layer_17_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_1m_l0_big/config.json b/resid_post/layer_17_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..23837aa50ceff6f3ee0320becd57700016e29970 --- /dev/null +++ b/resid_post/layer_17_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 1048576, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_1m_l0_medium/config.json b/resid_post/layer_17_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fbc00f40b6fc903004027fb75947794d3bd7185e --- /dev/null +++ b/resid_post/layer_17_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 1048576, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_262k_l0_big/config.json b/resid_post/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..24de929bf91892960ea16345c9308823416c30b3 --- /dev/null +++ b/resid_post/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_17_width_65k_l0_big/config.json b/resid_post/layer_17_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7fd2bfb650bff4d612830fa21f858a9970ca8aba --- /dev/null +++ b/resid_post/layer_17_width_65k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_16k_l0_small/config.json b/resid_post/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec25fb5ed4d2814a072225d5ae6229c7069cd05d --- /dev/null +++ b/resid_post/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_1m_l0_big/config.json b/resid_post/layer_22_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e2e05c1a6461b747264f5d2aa8a0b515ab820698 --- /dev/null +++ b/resid_post/layer_22_width_1m_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 1048576, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_1m_l0_medium/config.json b/resid_post/layer_22_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d3374ad9157b0a51676c9777f164d4e6fb51ce52 --- /dev/null +++ b/resid_post/layer_22_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 1048576, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_22_width_262k_l0_big/config.json b/resid_post/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..739d2545bf6ff7384b117ca3dec7f8a6b94bdf12 --- /dev/null +++ b/resid_post/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_29_width_16k_l0_big/config.json b/resid_post/layer_29_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f01377700ca37a45071d0d4c34d2b9e32d322a88 --- /dev/null +++ b/resid_post/layer_29_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_29_width_16k_l0_small/config.json b/resid_post/layer_29_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3bdeb8ccbcf488d3d1d99e8772022fd899db35b2 --- /dev/null +++ b/resid_post/layer_29_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_29_width_262k_l0_big/config.json b/resid_post/layer_29_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9ec197902e60dabf50edff7f1997cb04f27ddfa9 --- /dev/null +++ b/resid_post/layer_29_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_29_width_262k_l0_medium/config.json b/resid_post/layer_29_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e7ebf8a4f89d1d37d6a207eade08f171e07d3694 --- /dev/null +++ b/resid_post/layer_29_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_9_width_16k_l0_medium/config.json b/resid_post/layer_9_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9c97d4e49a3006de49234881ba1ece3249098e87 --- /dev/null +++ b/resid_post/layer_9_width_16k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_medium/config.json b/resid_post/layer_9_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bdd606e42b19a4fdcce375084c5dc0f7d676eb4d --- /dev/null +++ b/resid_post/layer_9_width_1m_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 1048576, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_small/config.json b/resid_post/layer_9_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f3b741e37b83229e5f1310d3aaddba53a5ab265 --- /dev/null +++ b/resid_post/layer_9_width_1m_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 1048576, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_medium/config.json b/resid_post/layer_9_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1ee337356bb97675e574b07fe24f51b79e2c83ef --- /dev/null +++ b/resid_post/layer_9_width_262k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1ee337356bb97675e574b07fe24f51b79e2c83ef --- /dev/null +++ b/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_small/config.json b/resid_post/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b5958b7e6f2781e8b8e5afe66bd8e8d1926860b7 --- /dev/null +++ b/resid_post/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_medium/config.json b/resid_post/layer_9_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0a1a8ef66268d84ba8f9fb57af103cf60e8bef0 --- /dev/null +++ b/resid_post/layer_9_width_65k_l0_medium/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 65536, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 53, + "affine_connection": false, + "type": "sae" +} \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_small/config.json b/transcoder_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..39421e59b8c3684d2cc8c4df3dc71db691262b63 --- /dev/null +++ b/transcoder_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_big_affine/config.json b/transcoder_all/layer_10_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..38053fa0ff6bfb6c6b7123df774956b0b0a3e445 --- /dev/null +++ b/transcoder_all/layer_10_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 112, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_big_affine/config.json b/transcoder_all/layer_10_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ecd67594903c6c6b889eaa7ff760db7a4d4aee5a --- /dev/null +++ b/transcoder_all/layer_10_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 112, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_small/config.json b/transcoder_all/layer_11_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c3f97322a618b65fbe8893b65d4dfbf77347ee92 --- /dev/null +++ b/transcoder_all/layer_11_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_small_affine/config.json b/transcoder_all/layer_11_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1164730a7f6bec540cce2e93d0e8d22b5a30abe3 --- /dev/null +++ b/transcoder_all/layer_11_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_big/config.json b/transcoder_all/layer_11_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f6ba7ce5095ad5c2cb1b9bd1845ddcd8c3421396 --- /dev/null +++ b/transcoder_all/layer_11_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 118, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_big_affine/config.json b/transcoder_all/layer_13_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9f2405d46560671c8492a50be2fb51c8ad87aace --- /dev/null +++ b/transcoder_all/layer_13_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_small/config.json b/transcoder_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ac01cf6929c4b0daeee6d69f89e8d4b46aefe49e --- /dev/null +++ b/transcoder_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_big/config.json b/transcoder_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5f451b3ce0d978fe979119d583d73ffe4f83b83c --- /dev/null +++ b/transcoder_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_small/config.json b/transcoder_all/layer_14_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a9f104165501172718f83906cf1f1589ee019b4b --- /dev/null +++ b/transcoder_all/layer_14_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_big/config.json b/transcoder_all/layer_14_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..af725aa256807a17399796772ec29530f0c1d5a3 --- /dev/null +++ b/transcoder_all/layer_14_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_big/config.json b/transcoder_all/layer_15_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6d7ea45b940fc64cca1cf288021d6d6ba9a10fc1 --- /dev/null +++ b/transcoder_all/layer_15_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small/config.json b/transcoder_all/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b6e41fb394c851c52f6b5459e02bec083b2e62d1 --- /dev/null +++ b/transcoder_all/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_small_affine/config.json b/transcoder_all/layer_18_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0066bf167be8c8d686b5ad89151e9775a358fd7c --- /dev/null +++ b/transcoder_all/layer_18_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_big/config.json b/transcoder_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1b37d68e08d8fa325947e70b02ac1a54dadf7146 --- /dev/null +++ b/transcoder_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_big_affine/config.json b/transcoder_all/layer_19_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..536aa0f00a9a049a39a018647cc9af244318be84 --- /dev/null +++ b/transcoder_all/layer_19_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_small/config.json b/transcoder_all/layer_1_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6d0c38ff05ab535d96921d1baec927d05e414887 --- /dev/null +++ b/transcoder_all/layer_1_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_big_affine/config.json b/transcoder_all/layer_20_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6732259b3d15aff58c1fca4dd13237614f9e0d65 --- /dev/null +++ b/transcoder_all/layer_20_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_big/config.json b/transcoder_all/layer_20_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f7d78cbe5494d4357c0fe7be1271122b1c706550 --- /dev/null +++ b/transcoder_all/layer_20_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_22_width_16k_l0_big/config.json b/transcoder_all/layer_22_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ebc5f599404bb80ae14f9d30c3a1ad49e54f45e --- /dev/null +++ b/transcoder_all/layer_22_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_big/config.json b/transcoder_all/layer_23_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32a7dbccf17516c6f6b173e214242170b97c6c5b --- /dev/null +++ b/transcoder_all/layer_23_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_small/config.json b/transcoder_all/layer_24_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..39153dc21554fbdb1942574b47061fb3e49946ec --- /dev/null +++ b/transcoder_all/layer_24_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_small/config.json b/transcoder_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aa8971a89d37b15c53da72e24979079433ab5174 --- /dev/null +++ b/transcoder_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_small_affine/config.json b/transcoder_all/layer_25_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..24a00e18b3fb7b63f5ed55b591cd5094e4904cab --- /dev/null +++ b/transcoder_all/layer_25_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_26_width_16k_l0_big_affine/config.json b/transcoder_all/layer_26_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aa9186519c4b6ab017576514205c442960c22845 --- /dev/null +++ b/transcoder_all/layer_26_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_27_width_262k_l0_big_affine/config.json b/transcoder_all/layer_27_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e91f8f8d93a28d63f9bbfb05ec93a55c75b9f3d5 --- /dev/null +++ b/transcoder_all/layer_27_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_27_width_262k_l0_small_affine/config.json b/transcoder_all/layer_27_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9c99401ea105673a9c441ba175bcf9d0ead48933 --- /dev/null +++ b/transcoder_all/layer_27_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_28_width_16k_l0_small_affine/config.json b/transcoder_all/layer_28_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4f69c08fa1d4223a0be489e9d452871b75e28ea0 --- /dev/null +++ b/transcoder_all/layer_28_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_29_width_262k_l0_small/config.json b/transcoder_all/layer_29_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0c0743bfbcc209a48c8831ab2b9ffd9028108b4d --- /dev/null +++ b/transcoder_all/layer_29_width_262k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_big_affine/config.json b/transcoder_all/layer_2_width_16k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b46a2750ee95f419a1a9cbd7a5d12a0952111dd8 --- /dev/null +++ b/transcoder_all/layer_2_width_16k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 70, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_big_affine/config.json b/transcoder_all/layer_2_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0fd77f1198603ac7310a77594ff1c6e2a8cd1346 --- /dev/null +++ b/transcoder_all/layer_2_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 70, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_30_width_262k_l0_big/config.json b/transcoder_all/layer_30_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..41015d66b14ea36d03221cf78d3aa3a0a6f640df --- /dev/null +++ b/transcoder_all/layer_30_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_31_width_262k_l0_big/config.json b/transcoder_all/layer_31_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f0cc8881588c458f9f2d1e9b1f1d52a3ac51445f --- /dev/null +++ b/transcoder_all/layer_31_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_32_width_262k_l0_big_affine/config.json b/transcoder_all/layer_32_width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7af7ad01a2aed555cdb5e2fa601a52186877277a --- /dev/null +++ b/transcoder_all/layer_32_width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_33_width_16k_l0_small_affine/config.json b/transcoder_all/layer_33_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4c6944b2973e824461c6123afdd23c922cef3fd1 --- /dev/null +++ b/transcoder_all/layer_33_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_33_width_262k_l0_big/config.json b/transcoder_all/layer_33_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4b9d70f58faf022667e4715a5c33b24b68b93775 --- /dev/null +++ b/transcoder_all/layer_33_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_small_affine/config.json b/transcoder_all/layer_3_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c0845513f0c5b1f648d66025c63ae796993088f3 --- /dev/null +++ b/transcoder_all/layer_3_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_big/config.json b/transcoder_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..544084677917674d89dd6b9e98e7d00a9fc71e6a --- /dev/null +++ b/transcoder_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 75, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_small_affine/config.json b/transcoder_all/layer_3_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c812ee28bfa49b598bab5dbe2ba0b03050722718 --- /dev/null +++ b/transcoder_all/layer_3_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_big/config.json b/transcoder_all/layer_5_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..71deb0934f0626a5347d0256b387d0f2aa04377b --- /dev/null +++ b/transcoder_all/layer_5_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 86, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_small_affine/config.json b/transcoder_all/layer_7_width_16k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6644cf457b190cb4fdd9812aeede2ad22cdaf76e --- /dev/null +++ b/transcoder_all/layer_7_width_16k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_small/config.json b/transcoder_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8bba8e7958a59d47c0eec1c6b90325895366c1bc --- /dev/null +++ b/transcoder_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_small_affine/config.json b/transcoder_all/layer_8_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9cc9da77f325f05ffc07ea554575dbb78df39696 --- /dev/null +++ b/transcoder_all/layer_8_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_big/config.json b/transcoder_all/layer_9_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd33228e1fc0409dd8437deb46e73a01a2b37b8e --- /dev/null +++ b/transcoder_all/layer_9_width_16k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 107, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_small/config.json b/transcoder_all/layer_9_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..24aff2fd0b6e371b1744645afb0427a730fd0584 --- /dev/null +++ b/transcoder_all/layer_9_width_16k_l0_small/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false, + "type": "transcoder" +} \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_small_affine/config.json b/transcoder_all/layer_9_width_262k_l0_small_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e5bf92adb47f403f610f986a6094749872224f3f --- /dev/null +++ b/transcoder_all/layer_9_width_262k_l0_small_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "google/gemma-3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": true, + "type": "transcoder" +} \ No newline at end of file