diff --git a/attn_out_all/layer_10_width_262k_l0_small/config.json b/attn_out_all/layer_10_width_262k_l0_small/config.json index b5dfcc498e9a073b53581e174cd32f72214d5d24..361d0380d4fdd07a2df40324ec43d828ffd0ae49 100644 --- a/attn_out_all/layer_10_width_262k_l0_small/config.json +++ b/attn_out_all/layer_10_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.10.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_11_width_262k_l0_big/config.json b/attn_out_all/layer_11_width_262k_l0_big/config.json index 7bce2b80f4852d1937280ba305080b44c7d1897a..d0a759eeaca84de7ded05f06b4b3e0a3cddbd2ed 100644 --- a/attn_out_all/layer_11_width_262k_l0_big/config.json +++ b/attn_out_all/layer_11_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.11.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_12_width_16k_l0_big/config.json b/attn_out_all/layer_12_width_16k_l0_big/config.json index aca5daba0aa0c9b10843f953ea6dda9f7d8e2646..225d19921e336f66aacc69116adfe18b0477d4f4 100644 --- a/attn_out_all/layer_12_width_16k_l0_big/config.json +++ b/attn_out_all/layer_12_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_12_width_16k_l0_small/config.json b/attn_out_all/layer_12_width_16k_l0_small/config.json index 29b5ac659ab546465baaa5dc1977741db90c4219..396a62dc28cf4f349072ba92c1d645a7191f4fb8 100644 --- a/attn_out_all/layer_12_width_16k_l0_small/config.json +++ b/attn_out_all/layer_12_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_12_width_262k_l0_big/config.json b/attn_out_all/layer_12_width_262k_l0_big/config.json index 2e1fc5e1b6928c0259588d09308b27a73717c0b5..608b22314efd3bc0b31ef8635d9d20be41a60f4d 100644 --- a/attn_out_all/layer_12_width_262k_l0_big/config.json +++ b/attn_out_all/layer_12_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_12_width_262k_l0_small/config.json b/attn_out_all/layer_12_width_262k_l0_small/config.json index 3da5a1b1e67e845033f8054af063c1f0aade6a3d..429ef796304fc94424d56ab7434f1e942692519c 100644 --- a/attn_out_all/layer_12_width_262k_l0_small/config.json +++ b/attn_out_all/layer_12_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_13_width_262k_l0_big/config.json b/attn_out_all/layer_13_width_262k_l0_big/config.json index afaa6e3a12418945c257001d93d4a69cb0f5df22..5034dce21d6bb870c409812969b7da533a47847a 100644 --- a/attn_out_all/layer_13_width_262k_l0_big/config.json +++ b/attn_out_all/layer_13_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_13_width_262k_l0_small/config.json b/attn_out_all/layer_13_width_262k_l0_small/config.json index 0b020cd7fe05a4eb7232a61f124cdb0ecc58cb83..d90c8ec5fd4f02b26980c2b918f44a5170c18435 100644 --- a/attn_out_all/layer_13_width_262k_l0_small/config.json +++ b/attn_out_all/layer_13_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_14_width_16k_l0_small/config.json b/attn_out_all/layer_14_width_16k_l0_small/config.json index b3ea3ab29c169fdeb38197f33bfcf1ce31acd560..9e0d2b31fdbf54e919866a7e8038cba9d9e08b3f 100644 --- a/attn_out_all/layer_14_width_16k_l0_small/config.json +++ b/attn_out_all/layer_14_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.14.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_14_width_262k_l0_big/config.json b/attn_out_all/layer_14_width_262k_l0_big/config.json index 283b16fe1ebeb1e480f6e90cee116fc9c3be1315..84643d166703266ad1c7997d7dc524a7a2bbbb3e 100644 --- a/attn_out_all/layer_14_width_262k_l0_big/config.json +++ b/attn_out_all/layer_14_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.14.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_15_width_16k_l0_small/config.json b/attn_out_all/layer_15_width_16k_l0_small/config.json index 8af587587fbb3f3aff89e019e7c99354605214f0..6f506a881310f8aa58c22325ca750b68dc80f10d 100644 --- a/attn_out_all/layer_15_width_16k_l0_small/config.json +++ b/attn_out_all/layer_15_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_15_width_262k_l0_small/config.json b/attn_out_all/layer_15_width_262k_l0_small/config.json index 3ab9c7f82922964f336399667721e6e876c7b624..8bbcb0c822eebdd7d33f2c05df610e86ee39c104 100644 --- a/attn_out_all/layer_15_width_262k_l0_small/config.json +++ b/attn_out_all/layer_15_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_16_width_16k_l0_big/config.json b/attn_out_all/layer_16_width_16k_l0_big/config.json index 0d849adf7f6d0523400e9e75a2206fe37127c13b..72b0980d447f15e7023e32d62d16a99916ae1280 100644 --- a/attn_out_all/layer_16_width_16k_l0_big/config.json +++ b/attn_out_all/layer_16_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.16.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_16_width_16k_l0_small/config.json b/attn_out_all/layer_16_width_16k_l0_small/config.json index ecd49d43cef32d352a1f1d4da0ff2eeedf149039..460efdb9d88172baec1538f176f0bc17bda4ef70 100644 --- a/attn_out_all/layer_16_width_16k_l0_small/config.json +++ b/attn_out_all/layer_16_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.16.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_16_width_262k_l0_big/config.json b/attn_out_all/layer_16_width_262k_l0_big/config.json index c6aa890332e4784c7d15cdb5341b80f9be6d384d..c5457240a39d61c0328ee977fd10f7e38517bc10 100644 --- a/attn_out_all/layer_16_width_262k_l0_big/config.json +++ b/attn_out_all/layer_16_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.16.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_1_width_16k_l0_big/config.json b/attn_out_all/layer_1_width_16k_l0_big/config.json index 4327e3478d0e536b72e1d2804755a06455b01fed..513702c6fd6c6a6686fa15c963355d5722d7531e 100644 --- a/attn_out_all/layer_1_width_16k_l0_big/config.json +++ b/attn_out_all/layer_1_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 70, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_1_width_16k_l0_small/config.json b/attn_out_all/layer_1_width_16k_l0_small/config.json index 92c892b8fee9b04681b2a7030b16334e4b3506cd..06e91cdd11b0832fbf6cb9cd02e34f69bc7fdc60 100644 --- a/attn_out_all/layer_1_width_16k_l0_small/config.json +++ b/attn_out_all/layer_1_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 11, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_1_width_262k_l0_big/config.json b/attn_out_all/layer_1_width_262k_l0_big/config.json index 578acbf6e999cf6a0866c66932d4730e9415832e..22143d9bd7de69df3de5adfb41669586f28b66bc 100644 --- a/attn_out_all/layer_1_width_262k_l0_big/config.json +++ b/attn_out_all/layer_1_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 70, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_1_width_262k_l0_small/config.json b/attn_out_all/layer_1_width_262k_l0_small/config.json index 6d4015821e11c3bdb61f2eac53710e5682d8e89c..93ea5c39fe202eb6177db0ba181393310ff4ca3d 100644 --- a/attn_out_all/layer_1_width_262k_l0_small/config.json +++ b/attn_out_all/layer_1_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 11, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_3_width_262k_l0_big/config.json b/attn_out_all/layer_3_width_262k_l0_big/config.json index a14551633380e97df56ad496aede61f888883cf0..d2da4be6ecc43e2fa2242fec0899fc10954c29c5 100644 --- a/attn_out_all/layer_3_width_262k_l0_big/config.json +++ b/attn_out_all/layer_3_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.3.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 90, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_4_width_262k_l0_small/config.json b/attn_out_all/layer_4_width_262k_l0_small/config.json index 9dfb2d5a8fb0d6c93ccaa1dd347457ec647e08a7..d6a5f3da5432ffb54f822dd1f11605923f7c5048 100644 --- a/attn_out_all/layer_4_width_262k_l0_small/config.json +++ b/attn_out_all/layer_4_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.4.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 16, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_5_width_262k_l0_small/config.json b/attn_out_all/layer_5_width_262k_l0_small/config.json index 13ce70a30ef2f5d4e4bb2dc4e91b034350ff9723..b5e8cb951558abe70757551c3695fc0ca5490d46 100644 --- a/attn_out_all/layer_5_width_262k_l0_small/config.json +++ b/attn_out_all/layer_5_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_6_width_16k_l0_big/config.json b/attn_out_all/layer_6_width_16k_l0_big/config.json index be008c3bbb6763752ce5b858b3ce3ed5856f6745..6eaf06d3d83ad8a817d978f9715da8221d303b27 100644 --- a/attn_out_all/layer_6_width_16k_l0_big/config.json +++ b/attn_out_all/layer_6_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_6_width_262k_l0_big/config.json b/attn_out_all/layer_6_width_262k_l0_big/config.json index 0b3a8e9a214642b9b8f51178b5f3679546426d42..fa99a1cf22cf84e0db1c1b9dd7b6508d55000163 100644 --- a/attn_out_all/layer_6_width_262k_l0_big/config.json +++ b/attn_out_all/layer_6_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_6_width_262k_l0_small/config.json b/attn_out_all/layer_6_width_262k_l0_small/config.json index dfe5f0eb86e6b1edd12422ae85a827073a5759fa..eff0437ade1c58a97c6584f28dcc50b144139e65 100644 --- a/attn_out_all/layer_6_width_262k_l0_small/config.json +++ b/attn_out_all/layer_6_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_8_width_16k_l0_small/config.json b/attn_out_all/layer_8_width_16k_l0_small/config.json index e552045de545f5c3b8dd77824b211c704e9fabe2..92dc9fedaa3b16ac18b3af62a0f5693cddb5d36a 100644 --- a/attn_out_all/layer_8_width_16k_l0_small/config.json +++ b/attn_out_all/layer_8_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.8.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_9_width_16k_l0_big/config.json b/attn_out_all/layer_9_width_16k_l0_big/config.json index 229756451ab14be5160c194e8d96580328cb75d1..98a321f593cd9bfa81afee44aba1c6428113a16d 100644 --- a/attn_out_all/layer_9_width_16k_l0_big/config.json +++ b/attn_out_all/layer_9_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_9_width_262k_l0_small/config.json b/attn_out_all/layer_9_width_262k_l0_small/config.json index 96caefc3b99925a09474b3f5cc6830a0e092e290..21e453a2e435d44a3da6831fbf9897bd995a1259 100644 --- a/attn_out_all/layer_9_width_262k_l0_small/config.json +++ b/attn_out_all/layer_9_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/clt/width_262k_l0_big_affine/config.json b/clt/width_262k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..70f548809d9118b4d432f577474bd61656f7ea20 --- /dev/null +++ b/clt/width_262k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", + "width": 262080, + "model_name": "google/gemma-3-270m-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "clt" +} \ No newline at end of file diff --git a/clt/width_524k_l0_big/config.json b/clt/width_524k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..715a6c00fc1af493d71afaaf96a83caa3be27c52 --- /dev/null +++ b/clt/width_524k_l0_big/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", + "width": 524160, + "model_name": "google/gemma-3-270m-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false, + "type": "clt" +} \ No newline at end of file diff --git a/clt/width_524k_l0_big_affine/config.json b/clt/width_524k_l0_big_affine/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5619918e6e4c7517a54e03fdb6081bc667a7a65d --- /dev/null +++ b/clt/width_524k_l0_big_affine/config.json @@ -0,0 +1,10 @@ +{ + "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", + "width": 524160, + "model_name": "google/gemma-3-270m-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": true, + "type": "clt" +} \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_16k_l0_big/config.json b/mlp_out_all/layer_0_width_16k_l0_big/config.json index 5b39a4d16f0839fa34e6339d49bc67bc7e0045e0..46de4902128a55b3ba276702490dbc2c146cc6ef 100644 --- a/mlp_out_all/layer_0_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_0_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_16k_l0_small/config.json b/mlp_out_all/layer_0_width_16k_l0_small/config.json index 89d6cba8572ca3d2e17d14ad6b1a2176d93c7e4e..a9fc7ebaa94d333a103ed30625dcc7ad935bcf86 100644 --- a/mlp_out_all/layer_0_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_0_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_262k_l0_big/config.json b/mlp_out_all/layer_0_width_262k_l0_big/config.json index 18d2faca08891efca7010f01c6620ecda47b2ab0..f571c01aa9b7b39201df17ae0004b6b0d9d0bad2 100644 --- a/mlp_out_all/layer_0_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_0_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_262k_l0_small/config.json b/mlp_out_all/layer_0_width_262k_l0_small/config.json index a4520b7657456db85278ed28bb611aaa180b432e..78af82af68b1e9c9d0b3f188b05ebbbcb8aee03b 100644 --- a/mlp_out_all/layer_0_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_0_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_16k_l0_big/config.json b/mlp_out_all/layer_10_width_16k_l0_big/config.json index ddfc741bb9af7aa6bef10ae61230f6146ef4b72e..0c7cced4ca0a883f39f8dd71d6097ed147f910eb 100644 --- a/mlp_out_all/layer_10_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_10_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_16k_l0_small/config.json b/mlp_out_all/layer_10_width_16k_l0_small/config.json index 3d3b76ed2bf356072a5ca44d307fc94afb087702..1e397a6d2ca74068df50626ea7e819a0afc135f4 100644 --- a/mlp_out_all/layer_10_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_10_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_262k_l0_big/config.json b/mlp_out_all/layer_10_width_262k_l0_big/config.json index f75a852c0e207847178327c3744e1fc5538369bf..aa48fec11817cf65a49c1e95745e9fe012d9a1d5 100644 --- a/mlp_out_all/layer_10_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_10_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_16k_l0_big/config.json b/mlp_out_all/layer_11_width_16k_l0_big/config.json index 4ea92fa64db24c264806d312a21787b985d5c085..eecbfef4980edace32f0df0d462cc7f34dbd9f48 100644 --- a/mlp_out_all/layer_11_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_11_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_16k_l0_small/config.json b/mlp_out_all/layer_11_width_16k_l0_small/config.json index 3cae67c396451bafb74d2e68c4f27df91447f4e0..9e3e809647db3e88ba5415e082a99cf314ae0d66 100644 --- a/mlp_out_all/layer_11_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_11_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_262k_l0_small/config.json b/mlp_out_all/layer_11_width_262k_l0_small/config.json index 36ac9f731b6119fbe8b17383c39666da3ef44324..76825fecc9ffa7b17f12952072faf3c5b65b91e9 100644 --- a/mlp_out_all/layer_11_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_11_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_16k_l0_big/config.json b/mlp_out_all/layer_13_width_16k_l0_big/config.json index e30c90aa2a45131be6cf2602265825aa5dd7ba54..a291d63a6c764e19855af9ea48c369cbe4fddd7a 100644 --- a/mlp_out_all/layer_13_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_13_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_16k_l0_small/config.json b/mlp_out_all/layer_13_width_16k_l0_small/config.json index 43cec8ab7182619abc7e126b8ed53ea3b7cce855..2f16d177da0f0c7a625a82ee8231245a35b64d10 100644 --- a/mlp_out_all/layer_13_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_13_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_16k_l0_big/config.json b/mlp_out_all/layer_14_width_16k_l0_big/config.json index 0dc7c48fcee9f871cafb58ee31ecef4f9968951d..6f4a05f52caae6634688fc0b9bd6b636aae68294 100644 --- a/mlp_out_all/layer_14_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_14_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_262k_l0_small/config.json b/mlp_out_all/layer_14_width_262k_l0_small/config.json index 2f386af075e39d4ee44a4cb16fa5a1ca0f974028..88114e4cab4f699203950aaef3952d416009c0bb 100644 --- a/mlp_out_all/layer_14_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_14_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_16k_l0_big/config.json b/mlp_out_all/layer_15_width_16k_l0_big/config.json index 3225092e67831e863037f9a3493b47e725c730c2..1983e6fec2d1f472bc638447aee76ce229b0fe50 100644 --- a/mlp_out_all/layer_15_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_15_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_262k_l0_big/config.json b/mlp_out_all/layer_15_width_262k_l0_big/config.json index e05ebb7eedc5f05b74f205cc57eec9a4495d4c07..0d9241f018fb29571dac049fd31994224844ce32 100644 --- a/mlp_out_all/layer_15_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_15_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_262k_l0_small/config.json b/mlp_out_all/layer_16_width_262k_l0_small/config.json index ae6c353d1fc0bf3f6ee9d61dc3ec25e6d6969b84..d529d181cbb97ac424dce77e5c9a276aeaa47fe2 100644 --- a/mlp_out_all/layer_16_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_16_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_16k_l0_big/config.json b/mlp_out_all/layer_17_width_16k_l0_big/config.json index f82d943a62eade9f904abfef3981971fe774de6f..99b012f380d3cde30d63373d623b901d1b31aa08 100644 --- a/mlp_out_all/layer_17_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_17_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_16k_l0_small/config.json b/mlp_out_all/layer_17_width_16k_l0_small/config.json index 54b429fd6e3734584d462b921e02483b7b480988..ab09d2f69f1c15ad7e3a348338f57d7de49bfeb2 100644 --- a/mlp_out_all/layer_17_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_17_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_big/config.json b/mlp_out_all/layer_17_width_262k_l0_big/config.json index fe8da18bbc2f6dad3abd1be835c5431cd188c28c..e9d46fa9d2aff080992986056c471dbacadab443 100644 --- a/mlp_out_all/layer_17_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_17_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_small/config.json b/mlp_out_all/layer_17_width_262k_l0_small/config.json index c58764f4c8a78c4305bb88f8a094be77771c4bb0..68faf82a0c272e35a9faf6ce8d662567c62b894b 100644 --- a/mlp_out_all/layer_17_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_17_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_16k_l0_big/config.json b/mlp_out_all/layer_2_width_16k_l0_big/config.json index 6114a6632864223b561e9bf5fc5f8356ed37788a..411c245c1d197db1856ce871e650c92af270aab3 100644 --- a/mlp_out_all/layer_2_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_2_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 80, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_16k_l0_small/config.json b/mlp_out_all/layer_2_width_16k_l0_small/config.json index ed4ff49c1924675f40029f9e6a0ec8e72cd657c7..8749a540f2028898f8c001f4390d2109f0f371ce 100644 --- a/mlp_out_all/layer_2_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_2_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_262k_l0_big/config.json b/mlp_out_all/layer_2_width_262k_l0_big/config.json index 8d81d9653bf67f232512584f3f94b59aa6fded49..a8482c3a5eec3a9c1b01849cd4f9a18323425ba3 100644 --- a/mlp_out_all/layer_2_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_2_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 80, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_262k_l0_small/config.json b/mlp_out_all/layer_2_width_262k_l0_small/config.json index 40a1faf44bb4dddfa9d8998db81d938b586a727a..1073d620d8e17355bd3052ee01f679b62c39356d 100644 --- a/mlp_out_all/layer_2_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_2_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_16k_l0_big/config.json b/mlp_out_all/layer_3_width_16k_l0_big/config.json index 88f295d1cae2758222f730858d76dd749857744f..93be5679798ac8c7291d5877d5aec74e52d8e3c1 100644 --- a/mlp_out_all/layer_3_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_3_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 90, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_16k_l0_small/config.json b/mlp_out_all/layer_3_width_16k_l0_small/config.json index aed56bf8572aac6d3ec479389142211fce66936c..180da4ad56056d9507d0b33b36e890e2063c22dd 100644 --- a/mlp_out_all/layer_3_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_3_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_262k_l0_small/config.json b/mlp_out_all/layer_3_width_262k_l0_small/config.json index 9f214248bab87c466f1108ae49318d99c580f8dc..1b72365ff2cf120b725ee0d9c05ba9c1d6d744ee 100644 --- a/mlp_out_all/layer_3_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_3_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_16k_l0_big/config.json b/mlp_out_all/layer_4_width_16k_l0_big/config.json index c5a5db4ccb7fd2dd2fc4575607576bb660a4eda9..9e40fe63acd7d64d5016df65830c1595bf4dd57c 100644 --- a/mlp_out_all/layer_4_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_4_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 100, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_262k_l0_big/config.json b/mlp_out_all/layer_4_width_262k_l0_big/config.json index 956474b54126b2bd2e25eceb9799daaf01122776..fc98a2bacab1a741c72bdb1547e9d4b9c726434b 100644 --- a/mlp_out_all/layer_4_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_4_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 100, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_16k_l0_big/config.json b/mlp_out_all/layer_5_width_16k_l0_big/config.json index b01f07ee2638a1fefffbfd15f8a0ebb50042ed0e..1c0f90e8dff3a333ac749a0c9c69642692a0f738 100644 --- a/mlp_out_all/layer_5_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_5_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 110, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_16k_l0_small/config.json b/mlp_out_all/layer_5_width_16k_l0_small/config.json index 10784f014dd7bdd20db058ef0159a0bb74d016c1..63c8a46970b76808f99924d2bcf2f9f59579abe3 100644 --- a/mlp_out_all/layer_5_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_5_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_262k_l0_big/config.json b/mlp_out_all/layer_5_width_262k_l0_big/config.json index 382578d42b34b1afe3f7dd6fb9dbf2df032eeaa6..001200d29c4dd2edc07f013e9d7caa194fe36217 100644 --- a/mlp_out_all/layer_5_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_5_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 110, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_16k_l0_small/config.json b/mlp_out_all/layer_6_width_16k_l0_small/config.json index 9414c407e31cbd562577a503ab4557f533795066..029c146ef1f5d977ed66ee8de7893a8d6326ba78 100644 --- a/mlp_out_all/layer_6_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_6_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_big/config.json b/mlp_out_all/layer_7_width_16k_l0_big/config.json index 1e1e6c31690c6ff2c94718ba164beb8e2c5c383f..62a1f743a6cf4d8d5957dfb0af3fbda2adf149bc 100644 --- a/mlp_out_all/layer_7_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_7_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_small/config.json b/mlp_out_all/layer_7_width_16k_l0_small/config.json index e57e516390e3dea62053876f124f962495b8a713..f48d2aff6c76bc9f737757e98d964284c4925b69 100644 --- a/mlp_out_all/layer_7_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_7_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_262k_l0_big/config.json b/mlp_out_all/layer_7_width_262k_l0_big/config.json index f66155c110765c04c447ecba788c80f6828f32e9..b34616dd187c669122eef0d4b7c94423616ec94b 100644 --- a/mlp_out_all/layer_7_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_7_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_262k_l0_small/config.json b/mlp_out_all/layer_7_width_262k_l0_small/config.json index f3e9b45a7b109d135674e79174715e7b06aafe68..6c5779d33e4084d706d526c9e88c35385eed4440 100644 --- a/mlp_out_all/layer_7_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_7_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_16k_l0_big/config.json b/mlp_out_all/layer_8_width_16k_l0_big/config.json index ee82f7f16da75b3c4d7e33aca2342a6b52984008..c8e9c56ff46d1cc844b813369f6cf9534c519b21 100644 --- a/mlp_out_all/layer_8_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_8_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_262k_l0_big/config.json b/mlp_out_all/layer_8_width_262k_l0_big/config.json index 18c9723c16b0cd7254e103947a9dc67c8e6ff3aa..185e762bef8fae145fc5eea3bd7a03ce3ac06a67 100644 --- a/mlp_out_all/layer_8_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_8_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_16k_l0_small/config.json b/mlp_out_all/layer_9_width_16k_l0_small/config.json index cd3b7db5c02977c5c6c0d825a2b1a85aee21c582..7d19da4dc4a8f951e3e0ff23ac9b5b9dafccee16 100644 --- a/mlp_out_all/layer_9_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_9_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_262k_l0_big/config.json b/mlp_out_all/layer_9_width_262k_l0_big/config.json index 6b7233c46a9aa30cc672c61e59cd2956067107c2..7035ce4990293e560d57a0bebdf6789ddb04b609 100644 --- a/mlp_out_all/layer_9_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_9_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_big/config.json b/resid_post/layer_12_width_16k_l0_big/config.json index f826c237d10c98f68cb0794bad72f50ecbc6908c..fdeba97326ec7526e29212643e1c1e27fe78c073 100644 --- a/resid_post/layer_12_width_16k_l0_big/config.json +++ b/resid_post/layer_12_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_medium/config.json b/resid_post/layer_12_width_16k_l0_medium/config.json index 84a8a70ce0e68403bd5eaf0a08ee9218460cac4c..da86553626467cfda25362caade9fbef8fd12d8f 100644 --- a/resid_post/layer_12_width_16k_l0_medium/config.json +++ b/resid_post/layer_12_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_small/config.json b/resid_post/layer_12_width_16k_l0_small/config.json index bdbc41118ca80baa0635a1ffc26b3f343d2f1822..331a11f97dd2f3ec98197692e8698494a7def988 100644 --- a/resid_post/layer_12_width_16k_l0_small/config.json +++ b/resid_post/layer_12_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_1m_l0_big/config.json b/resid_post/layer_12_width_1m_l0_big/config.json index bb9fd866d21b618a413e727da7d70653425f4b32..8027de4f56625753ce0fed6e8354ad968585b8cd 100644 --- a/resid_post/layer_12_width_1m_l0_big/config.json +++ b/resid_post/layer_12_width_1m_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_1m_l0_medium/config.json b/resid_post/layer_12_width_1m_l0_medium/config.json index d214ae167d372115529633e229b266b0d568f029..075a8223337b14a0252f222107ab287945f9876a 100644 --- a/resid_post/layer_12_width_1m_l0_medium/config.json +++ b/resid_post/layer_12_width_1m_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_1m_l0_small/config.json b/resid_post/layer_12_width_1m_l0_small/config.json index d5f92826a843c66b967a062d868db1ab413ca783..97205a07f4b5c90eee46d6a7853a0188d0aa2baa 100644 --- a/resid_post/layer_12_width_1m_l0_small/config.json +++ b/resid_post/layer_12_width_1m_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_big/config.json b/resid_post/layer_12_width_262k_l0_big/config.json index 2feee89b4d313aed046b55aab754d91ee8834210..d52f0334d9f29b42c309ddbdd4a1bd00a68bfcd1 100644 --- a/resid_post/layer_12_width_262k_l0_big/config.json +++ b/resid_post/layer_12_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_medium/config.json b/resid_post/layer_12_width_262k_l0_medium/config.json index 394af5d04044f1e6eab5caf80efebe5becf64376..122db3c4eecabac2fe5506a4be4111b0c930d173 100644 --- a/resid_post/layer_12_width_262k_l0_medium/config.json +++ b/resid_post/layer_12_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json index 394af5d04044f1e6eab5caf80efebe5becf64376..122db3c4eecabac2fe5506a4be4111b0c930d173 100644 --- a/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json +++ b/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_small/config.json b/resid_post/layer_12_width_262k_l0_small/config.json index e09713b37342c0c91afcb79f1289ad668278ae3f..dab84dc8d088c3c8e7bb78f986b8a6f00545d808 100644 --- a/resid_post/layer_12_width_262k_l0_small/config.json +++ b/resid_post/layer_12_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_65k_l0_big/config.json b/resid_post/layer_12_width_65k_l0_big/config.json index 7973f9a3da19093bddc574bf1802d501419dc96b..49e7355190eab85b62c5102067f18e67b161de44 100644 --- a/resid_post/layer_12_width_65k_l0_big/config.json +++ b/resid_post/layer_12_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_65k_l0_medium/config.json b/resid_post/layer_12_width_65k_l0_medium/config.json index 1ff9e7286bee08eaa47a19011b4d19e4a39be5a5..a4c73e082429402408908e60f77b0ae9039bf039 100644 --- a/resid_post/layer_12_width_65k_l0_medium/config.json +++ b/resid_post/layer_12_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_65k_l0_small/config.json b/resid_post/layer_12_width_65k_l0_small/config.json index a1af9ec0cc85e212b41a5d2acb6eb2e01de9b42e..79e4d8c314243f93de5b6f34188243e50000f5f0 100644 --- a/resid_post/layer_12_width_65k_l0_small/config.json +++ b/resid_post/layer_12_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_16k_l0_big/config.json b/resid_post/layer_15_width_16k_l0_big/config.json index 6784bb2b3abd550103105b76a246ad9c309ab04c..ef53050cf965a4f862333f04ba9b67fa2920531e 100644 --- a/resid_post/layer_15_width_16k_l0_big/config.json +++ b/resid_post/layer_15_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_16k_l0_medium/config.json b/resid_post/layer_15_width_16k_l0_medium/config.json index 20ddc9179302742c112a98c32893b4b2d5abf671..d51864420d544aa902fc6ed36b217d65c43d92ae 100644 --- a/resid_post/layer_15_width_16k_l0_medium/config.json +++ b/resid_post/layer_15_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_16k_l0_small/config.json b/resid_post/layer_15_width_16k_l0_small/config.json index 697adb2126504cce797abd247a81e2e3434b8938..3dbea1f1f7ccb50ec3dd34b62c0c2f61677d0174 100644 --- a/resid_post/layer_15_width_16k_l0_small/config.json +++ b/resid_post/layer_15_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_1m_l0_big/config.json b/resid_post/layer_15_width_1m_l0_big/config.json index 0f9543d77a01237232f58f639243ec274d37e99a..78f0f9f6f95baedc9a0fba7b6cdbe96d95149dfa 100644 --- a/resid_post/layer_15_width_1m_l0_big/config.json +++ b/resid_post/layer_15_width_1m_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_1m_l0_medium/config.json b/resid_post/layer_15_width_1m_l0_medium/config.json index dcf2446de1bb9c1cfb7a4a1d23ad50806b00dd1f..aa399ecbc743812c910e66c53b2319863b4ca408 100644 --- a/resid_post/layer_15_width_1m_l0_medium/config.json +++ b/resid_post/layer_15_width_1m_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_1m_l0_small/config.json b/resid_post/layer_15_width_1m_l0_small/config.json index b91407ff14d27b6aebc6d830c421de13c457dbf4..f8c0ae5e4c74f2e953b1ba49b02e756a74df35f2 100644 --- a/resid_post/layer_15_width_1m_l0_small/config.json +++ b/resid_post/layer_15_width_1m_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_262k_l0_big/config.json b/resid_post/layer_15_width_262k_l0_big/config.json index 5006361837b2bef415de39ae72ad07a9987323a1..9bd1e9186d0c143e72084f2bf1e7ed92c6b1305d 100644 --- a/resid_post/layer_15_width_262k_l0_big/config.json +++ b/resid_post/layer_15_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_262k_l0_medium/config.json b/resid_post/layer_15_width_262k_l0_medium/config.json index e9c072836e3977f181b5013c87f40340355673c4..2523051aae059c58a2960acc6bef6fc964cbe30a 100644 --- a/resid_post/layer_15_width_262k_l0_medium/config.json +++ b/resid_post/layer_15_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_15_width_262k_l0_medium_seed_1/config.json index e9c072836e3977f181b5013c87f40340355673c4..2523051aae059c58a2960acc6bef6fc964cbe30a 100644 --- a/resid_post/layer_15_width_262k_l0_medium_seed_1/config.json +++ b/resid_post/layer_15_width_262k_l0_medium_seed_1/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_262k_l0_small/config.json b/resid_post/layer_15_width_262k_l0_small/config.json index 5c4a856a2116f3537365d984757e24a43e04f9a3..e4e2c995f0781cbb819ee54a1fd822de40b54c02 100644 --- a/resid_post/layer_15_width_262k_l0_small/config.json +++ b/resid_post/layer_15_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_65k_l0_big/config.json b/resid_post/layer_15_width_65k_l0_big/config.json index 4b4190d708841258f489facae074aada57e813c4..9df4c33528ae2bc1abf18509b0fa93d9ee046249 100644 --- a/resid_post/layer_15_width_65k_l0_big/config.json +++ b/resid_post/layer_15_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_65k_l0_medium/config.json b/resid_post/layer_15_width_65k_l0_medium/config.json index c5850aab2af4c31ddb46d0dc48e4f6c37fd85202..66f44e7b53cf2aeb1dd9ef8341254eee0fad1b25 100644 --- a/resid_post/layer_15_width_65k_l0_medium/config.json +++ b/resid_post/layer_15_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_65k_l0_small/config.json b/resid_post/layer_15_width_65k_l0_small/config.json index 5a42dea83a98348cf38da7992d88959f12dd9fe4..ed972b381bf94beec88a5106999288f27805e463 100644 --- a/resid_post/layer_15_width_65k_l0_small/config.json +++ b/resid_post/layer_15_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_16k_l0_big/config.json b/resid_post/layer_5_width_16k_l0_big/config.json index 0cae03f0dfdc8aae99f26430efa6e67a8021dd94..c29baff69ad69f36dbefda164a9788cb47f5e9e6 100644 --- a/resid_post/layer_5_width_16k_l0_big/config.json +++ b/resid_post/layer_5_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_16k_l0_medium/config.json b/resid_post/layer_5_width_16k_l0_medium/config.json index 1dffbfd1225b4b8692d0215aae5ee21e848de185..6258694901365445ae97f62db554db3ee1730cc7 100644 --- a/resid_post/layer_5_width_16k_l0_medium/config.json +++ b/resid_post/layer_5_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_16k_l0_small/config.json b/resid_post/layer_5_width_16k_l0_small/config.json index 2dcb168cd43bc556091d381955ab6ffe1679e55f..8ba2534d126bab37f3e266d138a030003196913a 100644 --- a/resid_post/layer_5_width_16k_l0_small/config.json +++ b/resid_post/layer_5_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_1m_l0_big/config.json b/resid_post/layer_5_width_1m_l0_big/config.json index 361289ab97b137fe0d3464d09219f43541b778fd..079a1f0ade005385552586f9e53832ac017211c0 100644 --- a/resid_post/layer_5_width_1m_l0_big/config.json +++ b/resid_post/layer_5_width_1m_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_1m_l0_medium/config.json b/resid_post/layer_5_width_1m_l0_medium/config.json index 263c59adef870814494aa3a69fd38e1f53dd32d1..a5fa10c3a1b702a47bd3ad16aaeaeb4efd07c015 100644 --- a/resid_post/layer_5_width_1m_l0_medium/config.json +++ b/resid_post/layer_5_width_1m_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_1m_l0_small/config.json b/resid_post/layer_5_width_1m_l0_small/config.json index 0365e33dc70fb4a4b98762ca7362dee8ba374cce..ee58eb8b133394c7283109530803fa92b28730a5 100644 --- a/resid_post/layer_5_width_1m_l0_small/config.json +++ b/resid_post/layer_5_width_1m_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_262k_l0_big/config.json b/resid_post/layer_5_width_262k_l0_big/config.json index f6b278a535fb9f367d255452c09f00df0669b5ee..789f4f004a7850f5f5cfbcc9f281c920d8d6f198 100644 --- a/resid_post/layer_5_width_262k_l0_big/config.json +++ b/resid_post/layer_5_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_262k_l0_medium/config.json b/resid_post/layer_5_width_262k_l0_medium/config.json index d6091f0780e33b7fe149e88767e21b78db044b65..7bde89b98d64111f63594405633d66e51d9fbf05 100644 --- a/resid_post/layer_5_width_262k_l0_medium/config.json +++ b/resid_post/layer_5_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_5_width_262k_l0_medium_seed_1/config.json index d6091f0780e33b7fe149e88767e21b78db044b65..7bde89b98d64111f63594405633d66e51d9fbf05 100644 --- a/resid_post/layer_5_width_262k_l0_medium_seed_1/config.json +++ b/resid_post/layer_5_width_262k_l0_medium_seed_1/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_262k_l0_small/config.json b/resid_post/layer_5_width_262k_l0_small/config.json index 849efababe90effefabb5f6bdc8618ddc841ac81..cc5d70f0419601519a2555de1230abca440fdc31 100644 --- a/resid_post/layer_5_width_262k_l0_small/config.json +++ b/resid_post/layer_5_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_65k_l0_big/config.json b/resid_post/layer_5_width_65k_l0_big/config.json index 021ca208d942351de0743802539503a92eb86165..426ad213043c72eb67b07ee28292398ac0838eec 100644 --- a/resid_post/layer_5_width_65k_l0_big/config.json +++ b/resid_post/layer_5_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_65k_l0_medium/config.json b/resid_post/layer_5_width_65k_l0_medium/config.json index 75a7c327505194ea035f1b23f0dafb3385be7bf7..076f50560405e52cd3a625b4fe4e049464e6ad70 100644 --- a/resid_post/layer_5_width_65k_l0_medium/config.json +++ b/resid_post/layer_5_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_65k_l0_small/config.json b/resid_post/layer_5_width_65k_l0_small/config.json index bafe2fd212007b2e2e40c9669a186fe2a6bf2943..0a3e5e83e724624d840c4ae9f294210a6a9620db 100644 --- a/resid_post/layer_5_width_65k_l0_small/config.json +++ b/resid_post/layer_5_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_16k_l0_big/config.json b/resid_post/layer_9_width_16k_l0_big/config.json index 510f955d6bc6a71d115959026870bd9c378ceec9..f4d1c5613603d0f243b0dd1ebb68c997df8c4737 100644 --- a/resid_post/layer_9_width_16k_l0_big/config.json +++ b/resid_post/layer_9_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_16k_l0_medium/config.json b/resid_post/layer_9_width_16k_l0_medium/config.json index bfc4c337a6efa57f50fcea1ca9b538123968e693..1cb57fbe17d6eccc25e4fb057aea0e4fc754ba97 100644 --- a/resid_post/layer_9_width_16k_l0_medium/config.json +++ b/resid_post/layer_9_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_16k_l0_small/config.json b/resid_post/layer_9_width_16k_l0_small/config.json index a4efe4128987bc9fc59773bc3055605c306e3dc1..3f977e21583beb5a57ed713d570cf9de403b35e5 100644 --- a/resid_post/layer_9_width_16k_l0_small/config.json +++ b/resid_post/layer_9_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 16384, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_big/config.json b/resid_post/layer_9_width_1m_l0_big/config.json index 1908e16649cf202d94531d45eaa22b38f43f0c21..46d1e2342606ca1db44c2261b8154adc1c6f3e66 100644 --- a/resid_post/layer_9_width_1m_l0_big/config.json +++ b/resid_post/layer_9_width_1m_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_medium/config.json b/resid_post/layer_9_width_1m_l0_medium/config.json index fa9c14d4535e9ad1686a31a363125a4de7edb3bb..0b20f49ed46c82ac91b89969f2c703abcbf1c303 100644 --- a/resid_post/layer_9_width_1m_l0_medium/config.json +++ b/resid_post/layer_9_width_1m_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_small/config.json b/resid_post/layer_9_width_1m_l0_small/config.json index cbafe20704dbddeeeede6c3fb717c5c62b2c0136..cd4fc34c9ae15d0ad0891390e37b5fbcab97cd2a 100644 --- a/resid_post/layer_9_width_1m_l0_small/config.json +++ b/resid_post/layer_9_width_1m_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 1048576, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_big/config.json b/resid_post/layer_9_width_262k_l0_big/config.json index 28d0c5bac5e4e91df0e72d4a40e3679c13e35590..d6c409852eecd3451b39747cc114adde8b28aabd 100644 --- a/resid_post/layer_9_width_262k_l0_big/config.json +++ b/resid_post/layer_9_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_medium/config.json b/resid_post/layer_9_width_262k_l0_medium/config.json index 54205d2df209dbdda8a755e8e3e29970d8f62b5d..a82b07453918c73a397e86710a296b352cd6ae1e 100644 --- a/resid_post/layer_9_width_262k_l0_medium/config.json +++ b/resid_post/layer_9_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json index 54205d2df209dbdda8a755e8e3e29970d8f62b5d..a82b07453918c73a397e86710a296b352cd6ae1e 100644 --- a/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json +++ b/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_small/config.json b/resid_post/layer_9_width_262k_l0_small/config.json index faf2dc7cba6219565c0a30d5bd203411b2117486..8c7d0458aa65911901715dc72978a15a9219c541 100644 --- a/resid_post/layer_9_width_262k_l0_small/config.json +++ b/resid_post/layer_9_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 262144, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_big/config.json b/resid_post/layer_9_width_65k_l0_big/config.json index 66f89cda61cd32507c7cf79320bf00d202b443d1..3f168a2bbb3a56a9929700efb17a8b04a88a6d0d 100644 --- a/resid_post/layer_9_width_65k_l0_big/config.json +++ b/resid_post/layer_9_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_medium/config.json b/resid_post/layer_9_width_65k_l0_medium/config.json index 909375d6bcbcd58529d78a74fa78b2c708342e26..1bf4156c0faca7f50985f9be1951570e95005236 100644 --- a/resid_post/layer_9_width_65k_l0_medium/config.json +++ b/resid_post/layer_9_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_small/config.json b/resid_post/layer_9_width_65k_l0_small/config.json index 3a96cc0fb63e55551b776e11357af073cc462e20..be401efdf04b7f257a1fb46b865e1db18a51fd0f 100644 --- a/resid_post/layer_9_width_65k_l0_small/config.json +++ b/resid_post/layer_9_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 65536, - "model_name": "gemma-v3-270m-pt", + "model_name": "google/gemma-3-270m-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file