diff --git a/transcoder_all/layer_0_width_16k_l0_small_affine/config.json b/transcoder_all/layer_0_width_16k_l0_small_affine/config.json index 597175b40ec1305bf40a95c9bba3f8e935b00235..0168cf850794bc723b46873d7e999a0455a735e2 100644 --- a/transcoder_all/layer_0_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_0_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_big_affine/config.json b/transcoder_all/layer_10_width_262k_l0_big_affine/config.json index 02463cd6cf86adf4647657d0e715d314f56ba491..71fb4034dc72e6bfc8cdc8440f4a781b06f40ee1 100644 --- a/transcoder_all/layer_10_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_10_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 89, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_big_affine/config.json b/transcoder_all/layer_12_width_16k_l0_big_affine/config.json index 57ab0e73540536368f2f81a324bcabd47bfa9d8c..82b253c2a25acf6dce5001860eca94f9b848164e 100644 --- a/transcoder_all/layer_12_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_12_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 94, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_small/config.json b/transcoder_all/layer_14_width_262k_l0_small/config.json index 31d6f3704627455df5e15a4e671e0efd279468bf..2299de3fe75c75bd99c89f0a133082a0aa46bfd3 100644 --- a/transcoder_all/layer_14_width_262k_l0_small/config.json +++ b/transcoder_all/layer_14_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_small/config.json b/transcoder_all/layer_15_width_262k_l0_small/config.json index 1c0fc792b3f15541bfe46772d3127c4fc0fda717..2d9dcfa2c400a9a6209cb8988d8fbac3a1581651 100644 --- a/transcoder_all/layer_15_width_262k_l0_small/config.json +++ b/transcoder_all/layer_15_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 17, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_small_affine/config.json b/transcoder_all/layer_18_width_16k_l0_small_affine/config.json index c4706d602da548489ed6961f7918d4ce08d7587a..531dd9645958258728d51c06de926bec292d610e 100644 --- a/transcoder_all/layer_18_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_18_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_small_affine/config.json b/transcoder_all/layer_1_width_262k_l0_small_affine/config.json index 8e5b4a04d304d8c39a87b8262414bda22a735e06..43086c34ef5468c9627571e6035c48a5ceaf38f9 100644 --- a/transcoder_all/layer_1_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_1_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_21_width_262k_l0_small/config.json b/transcoder_all/layer_21_width_262k_l0_small/config.json index 0918832f9e1bc8aef61182ad1bb9271c3cca2dc3..6c915e25be0174933a14a172182fcf537a5570fd 100644 --- a/transcoder_all/layer_21_width_262k_l0_small/config.json +++ b/transcoder_all/layer_21_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_16k_l0_big_affine/config.json b/transcoder_all/layer_22_width_16k_l0_big_affine/config.json index 2160e193f59c42a3bc073787d3db234b923b3365..cff71e301b30c624367cc5e4bcdca476dbf3d3a4 100644 --- a/transcoder_all/layer_22_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_22_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_big_affine/config.json b/transcoder_all/layer_22_width_262k_l0_big_affine/config.json index 928e943bd31cd8e86108ac08c6d22ff132df8188..9734eb68f9bd14ab53b2817c92e54bfc729fd224 100644 --- a/transcoder_all/layer_22_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_22_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_big/config.json b/transcoder_all/layer_23_width_262k_l0_big/config.json index 6c1bd8689bb6f45682d9e0e7cdb67aa0680f28b7..5649675142b4da8095a8db9f0a9f296c49fe9448 100644 --- a/transcoder_all/layer_23_width_262k_l0_big/config.json +++ b/transcoder_all/layer_23_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_small_affine/config.json b/transcoder_all/layer_24_width_262k_l0_small_affine/config.json index 95b09423ed585648a0e769b7c288c7596af4ad1c..95e77778c5fa3fec495b6d04f9f6b064247d25fc 100644 --- a/transcoder_all/layer_24_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_24_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_big_affine/config.json b/transcoder_all/layer_25_width_262k_l0_big_affine/config.json index da9b132ac6e730d535fd9a040efc4e9c5c2cdfa9..70fab760f0d753fd3e0e4cff719eea1d8537789d 100644 --- a/transcoder_all/layer_25_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_25_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_16k_l0_big/config.json b/transcoder_all/layer_26_width_16k_l0_big/config.json index e11538a3675adca6b3a244b6eef81fff433bdf04..76c4049398ce90904b2f4a605505102235dfc024 100644 --- a/transcoder_all/layer_26_width_16k_l0_big/config.json +++ b/transcoder_all/layer_26_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_262k_l0_small/config.json b/transcoder_all/layer_27_width_262k_l0_small/config.json index 547037259cdf9cd10ae093aabdbcbf697608ccb6..784e17e60d7267a71eb1f89b29b67a70a9cc6e95 100644 --- a/transcoder_all/layer_27_width_262k_l0_small/config.json +++ b/transcoder_all/layer_27_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_28_width_16k_l0_small_affine/config.json b/transcoder_all/layer_28_width_16k_l0_small_affine/config.json index 14da97f7e72ac1f086d0a0522a0a44be3b9086ce..5c7d904f6f5e6b3685f23ec7c809806110235738 100644 --- a/transcoder_all/layer_28_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_28_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_28_width_262k_l0_big/config.json b/transcoder_all/layer_28_width_262k_l0_big/config.json index f82fadbaca3ed99dce8069fd51f156e19137bd38..9678848034186c6aa5c78d0c7224dcabea5d7f07 100644 --- a/transcoder_all/layer_28_width_262k_l0_big/config.json +++ b/transcoder_all/layer_28_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_16k_l0_big_affine/config.json b/transcoder_all/layer_29_width_16k_l0_big_affine/config.json index 1de343538cf4e4f7ba024383da44def0d6ba62f0..ca88c80055fe69be945afaa12e63e06c6ceac22a 100644 --- a/transcoder_all/layer_29_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_29_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_big/config.json b/transcoder_all/layer_2_width_16k_l0_big/config.json index 5a07f279055c41f4ceae01dd230bda1fc5d72f5a..bd0de008845f8252689c032fc79d77f6fa5d9b36 100644 --- a/transcoder_all/layer_2_width_16k_l0_big/config.json +++ b/transcoder_all/layer_2_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 65, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_small_affine/config.json b/transcoder_all/layer_2_width_262k_l0_small_affine/config.json index b3ed3faa845a2d6520042604752076af390851d4..b14d66ed4498bab039770217b38fed884a530705 100644 --- a/transcoder_all/layer_2_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_2_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_16k_l0_big_affine/config.json b/transcoder_all/layer_31_width_16k_l0_big_affine/config.json index ef5c7a0cab97ce1f1327d1703555147437d9f342..79e73adaeff07d9742442d083484c6a9ffa9cfe8 100644 --- a/transcoder_all/layer_31_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_31_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_16k_l0_small/config.json b/transcoder_all/layer_31_width_16k_l0_small/config.json index def1f209b4138eed98d5c84f6ee4da79498a94cf..635f4c81f66470142c151751320aa436ec60cb39 100644 --- a/transcoder_all/layer_31_width_16k_l0_small/config.json +++ b/transcoder_all/layer_31_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_16k_l0_small_affine/config.json b/transcoder_all/layer_31_width_16k_l0_small_affine/config.json index 819afbb625ce0a2f16d96710e46d50d77b14ef0f..4ac6e640b4335b1b149222f52b782ad8209eb63a 100644 --- a/transcoder_all/layer_31_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_31_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_32_width_16k_l0_big_affine/config.json b/transcoder_all/layer_32_width_16k_l0_big_affine/config.json index 5635b70a2c0312c84f10c3c92fe03a5148e3e705..7be461088bbeb82d4c71a91f3599ff42d89c7a85 100644 --- a/transcoder_all/layer_32_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_32_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_32_width_262k_l0_big/config.json b/transcoder_all/layer_32_width_262k_l0_big/config.json index cdd3897b7f31987ef195b4ce6f59ed4ed60ed1a5..cde1c433590bb13c98c92afd29fc0820e15b6474 100644 --- a/transcoder_all/layer_32_width_262k_l0_big/config.json +++ b/transcoder_all/layer_32_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_262k_l0_big_affine/config.json b/transcoder_all/layer_33_width_262k_l0_big_affine/config.json index fc1a2fd217b540bb11935c506f6e3636d92e07af..be6d55ba959f66a4cde03d96b916f5c586af6cce 100644 --- a/transcoder_all/layer_33_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_33_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_262k_l0_small_affine/config.json b/transcoder_all/layer_34_width_262k_l0_small_affine/config.json index 9cb7c40d03992ba649374aa616daeccb416034e6..d30b7e3228c5cd18b44d19873b7a6690872f931b 100644 --- a/transcoder_all/layer_34_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_34_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_36_width_16k_l0_big_affine/config.json b/transcoder_all/layer_36_width_16k_l0_big_affine/config.json index 0ab7c66d12ed1669ad75d326e2331e133e9fe1ae..5f2b99ce25802563b45cab3511ea57f96c29c306 100644 --- a/transcoder_all/layer_36_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_36_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.36.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_36_width_262k_l0_small_affine/config.json b/transcoder_all/layer_36_width_262k_l0_small_affine/config.json index 82e22fb281187903da6e637c636b28d73a3cbffa..e60675d186b43222ff416def5ee53c03eb529b7c 100644 --- a/transcoder_all/layer_36_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_36_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.36.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_16k_l0_small_affine/config.json b/transcoder_all/layer_38_width_16k_l0_small_affine/config.json index 692e70466aff6d6566cf4d2f66a9f792dff57fe9..b83fa3a27867a0fd76a0314470c604c0a7744af9 100644 --- a/transcoder_all/layer_38_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_38_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_262k_l0_big_affine/config.json b/transcoder_all/layer_38_width_262k_l0_big_affine/config.json index 3bdec10b8016515a487315c0e71f99a472695eff..b26a2fef5c7fd999323171b422fd61b1056a7a11 100644 --- a/transcoder_all/layer_38_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_38_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_small/config.json b/transcoder_all/layer_3_width_16k_l0_small/config.json index ab700217b2e686ba0a23d7cbaaf39b5ecc87aafa..1eda771bcddc68c66b914b7a89e12d092ae699c9 100644 --- a/transcoder_all/layer_3_width_16k_l0_small/config.json +++ b/transcoder_all/layer_3_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_42_width_262k_l0_small/config.json b/transcoder_all/layer_42_width_262k_l0_small/config.json index 836eeb432c90c912bf994ad70e363460742cedb7..1882e0bd95c75aa6795aa85db96db606b8d6a946 100644 --- a/transcoder_all/layer_42_width_262k_l0_small/config.json +++ b/transcoder_all/layer_42_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.42.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_42_width_262k_l0_small_affine/config.json b/transcoder_all/layer_42_width_262k_l0_small_affine/config.json index 8823f87774fcb21cb19e80ab221d0cddb653b6db..fb1ed9f49e642187e627e08eb7d7e8a7f3e38cc5 100644 --- a/transcoder_all/layer_42_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_42_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.42.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_43_width_262k_l0_small/config.json b/transcoder_all/layer_43_width_262k_l0_small/config.json index 06b15398b5bc8e2fe9fceab2ec9ace9e1ef3d450..66cfe07169e30d7f61984a31345f2554d7a6d11e 100644 --- a/transcoder_all/layer_43_width_262k_l0_small/config.json +++ b/transcoder_all/layer_43_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_44_width_16k_l0_small/config.json b/transcoder_all/layer_44_width_16k_l0_small/config.json index 5aa646851af06afae109c485d3dad5087503e811..50cd6fa69e6742b2239eb5006b22a5ce5be6c7c1 100644 --- a/transcoder_all/layer_44_width_16k_l0_small/config.json +++ b/transcoder_all/layer_44_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.44.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_45_width_16k_l0_big/config.json b/transcoder_all/layer_45_width_16k_l0_big/config.json index 70ca6e3f832ac1b6e6682ac965204730aa15a7b8..d42bfbd1841c9fea75b64e7b673251519c113ed4 100644 --- a/transcoder_all/layer_45_width_16k_l0_big/config.json +++ b/transcoder_all/layer_45_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.45.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_46_width_16k_l0_small/config.json b/transcoder_all/layer_46_width_16k_l0_small/config.json index 55e6eb9b6ec828ca1b59b3664df918704938b0fa..d875099c512926cf1e03a5b8502d42b49b4fcd63 100644 --- a/transcoder_all/layer_46_width_16k_l0_small/config.json +++ b/transcoder_all/layer_46_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.46.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.46.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_16k_l0_big/config.json b/transcoder_all/layer_47_width_16k_l0_big/config.json index 58ae7403ec2115943df05b57bd205344014ea33f..40b4234c4dce80a74e5175069847514bfe9da270 100644 --- a/transcoder_all/layer_47_width_16k_l0_big/config.json +++ b/transcoder_all/layer_47_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_16k_l0_small/config.json b/transcoder_all/layer_47_width_16k_l0_small/config.json index b31eaa1c1a4dd9ec210b27248997651969cc362d..807414f65eebaef6cfeedc633a1f5986ba2fbeba 100644 --- a/transcoder_all/layer_47_width_16k_l0_small/config.json +++ b/transcoder_all/layer_47_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_16k_l0_small/config.json b/transcoder_all/layer_48_width_16k_l0_small/config.json index 891e1789b9ea200d02fc3048116f568eb6aace18..8a868e0d7460a997f947340d4cfe4003ce7752e0 100644 --- a/transcoder_all/layer_48_width_16k_l0_small/config.json +++ b/transcoder_all/layer_48_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_262k_l0_small/config.json b/transcoder_all/layer_48_width_262k_l0_small/config.json index 2fb877defd300b056ca8a69790156903c564f58b..3e175ee4c0722e42f4d3708115d389396954d2f6 100644 --- a/transcoder_all/layer_48_width_262k_l0_small/config.json +++ b/transcoder_all/layer_48_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_262k_l0_small_affine/config.json b/transcoder_all/layer_48_width_262k_l0_small_affine/config.json index b31f869479880469f39808b8c14e6d1c94995de4..afbe9f58df7ecc59d6c0d0813381846acf339cef 100644 --- a/transcoder_all/layer_48_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_48_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_262k_l0_big/config.json b/transcoder_all/layer_49_width_262k_l0_big/config.json index 7cffe03f72b108b937889c479954e99f10c690b1..46e18a0db1c825710ca8c22fa9588387d81ddb64 100644 --- a/transcoder_all/layer_49_width_262k_l0_big/config.json +++ b/transcoder_all/layer_49_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_262k_l0_small/config.json b/transcoder_all/layer_49_width_262k_l0_small/config.json index 311e56f9f7d726bb70a8b947aff26f45e4ce3429..76d93fff1f6689b30b7d7ff8ec09932d620c6f1a 100644 --- a/transcoder_all/layer_49_width_262k_l0_small/config.json +++ b/transcoder_all/layer_49_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_big/config.json b/transcoder_all/layer_4_width_262k_l0_big/config.json index 01338ab001a86a1062f3c6d009b3e319eea652a9..934e0473c8405ada7992ba940d88325a860cde94 100644 --- a/transcoder_all/layer_4_width_262k_l0_big/config.json +++ b/transcoder_all/layer_4_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 71, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_16k_l0_small/config.json b/transcoder_all/layer_50_width_16k_l0_small/config.json index 40bc1665832593b2a3128b0e0e2ae2f2d4d96320..ff3e1865b87ae598ddab9aecdda816ebdece2219 100644 --- a/transcoder_all/layer_50_width_16k_l0_small/config.json +++ b/transcoder_all/layer_50_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_51_width_16k_l0_small_affine/config.json b/transcoder_all/layer_51_width_16k_l0_small_affine/config.json index 72eabc277195c47b21387ec68ab1e2c81dc692c6..0c9433c298932a8244028654e18c5107d8e997f7 100644 --- a/transcoder_all/layer_51_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_51_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.51.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.51.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_58_width_262k_l0_big_affine/config.json b/transcoder_all/layer_58_width_262k_l0_big_affine/config.json index 3be9b6360e26f6b956f05c3dac8f5ea4cc92566c..42e87d8bb72701f7a07d6a3d082f8bf81219bfa9 100644 --- a/transcoder_all/layer_58_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_58_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.58.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_59_width_16k_l0_small_affine/config.json b/transcoder_all/layer_59_width_16k_l0_small_affine/config.json index bace170feb7be5bf9568083a1aee56869bd3c757..cbeb0ac61c090e7044aecfc4e8802e42a8dc7047 100644 --- a/transcoder_all/layer_59_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_59_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.59.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.59.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_59_width_262k_l0_big_affine/config.json b/transcoder_all/layer_59_width_262k_l0_big_affine/config.json index 1abcaf202bf6d80bc0ccec2a9ecdccd6acfd6a9b..8219a557ca201883164a2e549d43cd879a3d73be 100644 --- a/transcoder_all/layer_59_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_59_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.59.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.59.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_61_width_262k_l0_big/config.json b/transcoder_all/layer_61_width_262k_l0_big/config.json index 2a2c704f6bba165fff76c67efc972c4bd4b7cb98..d9be13539359df6d736c822a4e8df0e91c3ce24b 100644 --- a/transcoder_all/layer_61_width_262k_l0_big/config.json +++ b/transcoder_all/layer_61_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.61.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_big_affine/config.json b/transcoder_all/layer_6_width_16k_l0_big_affine/config.json index 9117871fa2ddcba218c8d1c72749ebe04523672d..afb6d6d72f9c5022678c455dabe02627f5d87e63 100644 --- a/transcoder_all/layer_6_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_6_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 77, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_small_affine/config.json b/transcoder_all/layer_6_width_262k_l0_small_affine/config.json index 3333730f02c861d190a999168f842c6d3cc2f39e..de365e4b57441dbcc3ad1d1a9255adddc5dadbbf 100644 --- a/transcoder_all/layer_6_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_6_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 12, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_small/config.json b/transcoder_all/layer_8_width_262k_l0_small/config.json index 193bd1a69fa955960fa3bd3c0d2cf3d6dd5dabe6..bf97b2cbddb46f8412b96b1b83a9ab5469296934 100644 --- a/transcoder_all/layer_8_width_262k_l0_small/config.json +++ b/transcoder_all/layer_8_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_small_affine/config.json b/transcoder_all/layer_9_width_16k_l0_small_affine/config.json index 1ef6c73e4ee28bfba9124bfa4e15340907a0eccc..1efdbf464f0488b46a9ffbdc969c3ce709e889bb 100644 --- a/transcoder_all/layer_9_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_9_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 14, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file