diff --git a/transcoder_all/layer_0_width_262k_l0_small_affine/config.json b/transcoder_all/layer_0_width_262k_l0_small_affine/config.json index 841508ec9efcec015450a3c98d5fb673207733f6..6b6e70c5a7bdb82099cb4ce91633b2937d7629ca 100644 --- a/transcoder_all/layer_0_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_0_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_small_affine/config.json b/transcoder_all/layer_10_width_16k_l0_small_affine/config.json index 2f091317431f4224874d2b8088a9f8098c87e371..b2b11556af98f707f792f208a98dc0ec79d80302 100644 --- a/transcoder_all/layer_10_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_10_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 14, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_big_affine/config.json b/transcoder_all/layer_11_width_262k_l0_big_affine/config.json index fc43163c18c4f7c79ffc5b28c411b75c31404aac..160b83728aa9cfb049c2fc67b2699f7156edc4f0 100644 --- a/transcoder_all/layer_11_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_11_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 91, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_small_affine/config.json b/transcoder_all/layer_12_width_16k_l0_small_affine/config.json index 763aaede0d21037007618d08b42789077267ec23..eb09e4ee7dfb403b46d596d09cd76b8f54d35c73 100644 --- a/transcoder_all/layer_12_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_12_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_small/config.json b/transcoder_all/layer_13_width_262k_l0_small/config.json index da1b57c3117d6770144040a80d6a0bd2c3faeed1..c6de71c6efa39c99074902dddcf4ae55de08639e 100644 --- a/transcoder_all/layer_13_width_262k_l0_small/config.json +++ b/transcoder_all/layer_13_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_big/config.json b/transcoder_all/layer_18_width_16k_l0_big/config.json index d539c3849aa9509a8a1c8f98d21b66380f7da2ee..a2061bad6a6574f2ceca28704cc3f387ce4bb091 100644 --- a/transcoder_all/layer_18_width_16k_l0_big/config.json +++ b/transcoder_all/layer_18_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 112, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_small/config.json b/transcoder_all/layer_18_width_16k_l0_small/config.json index b3be8050e89273c25cc60ae0a613384c60972a37..bf5d92b53454a49b4a7497bdd14e4b49621de524 100644 --- a/transcoder_all/layer_18_width_16k_l0_small/config.json +++ b/transcoder_all/layer_18_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_16k_l0_big_affine/config.json b/transcoder_all/layer_1_width_16k_l0_big_affine/config.json index abd38826264ebbad1d3870b09fdadc14c8dc0699..ffc89afc268a4dcff67a224b681bbae943113a1d 100644 --- a/transcoder_all/layer_1_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_1_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 62, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_big/config.json b/transcoder_all/layer_1_width_262k_l0_big/config.json index 29f51e69ea806a8e0d78ba192195ff33992eb501..0cb3117c674f01c265322a5f0e25ec0c1d0db38e 100644 --- a/transcoder_all/layer_1_width_262k_l0_big/config.json +++ b/transcoder_all/layer_1_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 62, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_small_affine/config.json b/transcoder_all/layer_20_width_262k_l0_small_affine/config.json index 68b6991d9b68f6df189399ad0c6d0071ed928e5d..d156ab2ea76887cc0be40ca2c5351790429ec0b4 100644 --- a/transcoder_all/layer_20_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_20_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 19, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_21_width_16k_l0_big/config.json b/transcoder_all/layer_21_width_16k_l0_big/config.json index 7bdf90cfd66e403e905156cc8f8bfadfd1cb6689..42fa893c7e91b61c840fb7586cb132a088fb2cfa 100644 --- a/transcoder_all/layer_21_width_16k_l0_big/config.json +++ b/transcoder_all/layer_21_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_21_width_262k_l0_big/config.json b/transcoder_all/layer_21_width_262k_l0_big/config.json index b2cf797de0a7ede67850ffe1145bc1958fd95dfc..0d6c08fc7c37342c91f578e9811a1b18a6d2e823 100644 --- a/transcoder_all/layer_21_width_262k_l0_big/config.json +++ b/transcoder_all/layer_21_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_small/config.json b/transcoder_all/layer_23_width_262k_l0_small/config.json index 4fce90afd152b76409a261658149e0e84aaef505..772daa15f1886a6e3761c04caa16318b99b2dc6b 100644 --- a/transcoder_all/layer_23_width_262k_l0_small/config.json +++ b/transcoder_all/layer_23_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_small_affine/config.json b/transcoder_all/layer_24_width_16k_l0_small_affine/config.json index dc1e1bf493efa267eed0558355ab2e2ea71e793f..298854adda0915f642bcbd1fb221119124d20f65 100644 --- a/transcoder_all/layer_24_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_24_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_big_affine/config.json b/transcoder_all/layer_25_width_16k_l0_big_affine/config.json index d9bf7a63482bdf245eaeff84f0ac5a5d0139a722..c1bf65363bd3727a0e79d015df43841f0dcd396c 100644 --- a/transcoder_all/layer_25_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_25_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_small/config.json b/transcoder_all/layer_25_width_16k_l0_small/config.json index 4fcd36725b72bb8ef7c42ad6595bb377f24b7fe8..17f4b5bc6659217f0ccb1626a2b5f579ddcf3c2f 100644 --- a/transcoder_all/layer_25_width_16k_l0_small/config.json +++ b/transcoder_all/layer_25_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_262k_l0_big_affine/config.json b/transcoder_all/layer_26_width_262k_l0_big_affine/config.json index 5daa7ebff1b9af300ce23ae65d69d5ee2cea8401..8d03a16e405b9b2ddfce6d2f7b4a974fa0a40d61 100644 --- a/transcoder_all/layer_26_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_26_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_262k_l0_small/config.json b/transcoder_all/layer_30_width_262k_l0_small/config.json index dc9be8a47aa5f66d9a855127c1fa000a3ee5871b..b0b9fd0a84ae59b7907f059daa3c6be012c7a92f 100644 --- a/transcoder_all/layer_30_width_262k_l0_small/config.json +++ b/transcoder_all/layer_30_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_262k_l0_big/config.json b/transcoder_all/layer_31_width_262k_l0_big/config.json index 873821cf836ba080c09085ec1feaf833c2f3b3cc..326f2d9fe6f71ea8486edcd4757de6d30fe32292 100644 --- a/transcoder_all/layer_31_width_262k_l0_big/config.json +++ b/transcoder_all/layer_31_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_262k_l0_small/config.json b/transcoder_all/layer_31_width_262k_l0_small/config.json index 7a29d4ef7f68a7797de44b4106492d753f2732ed..137b5e414cb2c3da9dc905e676a62926071dbeee 100644 --- a/transcoder_all/layer_31_width_262k_l0_small/config.json +++ b/transcoder_all/layer_31_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_262k_l0_small_affine/config.json b/transcoder_all/layer_31_width_262k_l0_small_affine/config.json index fe7047b6862c4bda85f8775ed464104b6114bce6..3b6ab3d5d59fdb22ddc8e638899943bce0432e5d 100644 --- a/transcoder_all/layer_31_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_31_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_16k_l0_big/config.json b/transcoder_all/layer_33_width_16k_l0_big/config.json index 7a29543ca7ef5b186e09423262892ca7fffa2c17..db8d8679c81c67b0ac5daca620534dc182436c18 100644 --- a/transcoder_all/layer_33_width_16k_l0_big/config.json +++ b/transcoder_all/layer_33_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_16k_l0_big_affine/config.json b/transcoder_all/layer_33_width_16k_l0_big_affine/config.json index 25321b48306e8b0b8eea5d3f7f4e0e3d092489cd..4a94d1ec1a4a7a3d243b36a6082586509552966b 100644 --- a/transcoder_all/layer_33_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_33_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_16k_l0_big/config.json b/transcoder_all/layer_34_width_16k_l0_big/config.json index 510f57db3a2c5312b4e9c0ef223d84ca0d9db809..efeb813129c0de0d96b934ad1a0bba84cb1f4ca2 100644 --- a/transcoder_all/layer_34_width_16k_l0_big/config.json +++ b/transcoder_all/layer_34_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_16k_l0_small/config.json b/transcoder_all/layer_35_width_16k_l0_small/config.json index c7e164c07091c527f2c00e9a3722af67e6b23901..50532f0115ace50209fa046b21d0262ec6f40dea 100644 --- a/transcoder_all/layer_35_width_16k_l0_small/config.json +++ b/transcoder_all/layer_35_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_262k_l0_small/config.json b/transcoder_all/layer_35_width_262k_l0_small/config.json index 807425c6d8b2d31b7586f5ddf44852166164444e..60cd9a9178a4f7eaf8d8713c82b7506bdadba17e 100644 --- a/transcoder_all/layer_35_width_262k_l0_small/config.json +++ b/transcoder_all/layer_35_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_262k_l0_small/config.json b/transcoder_all/layer_37_width_262k_l0_small/config.json index b74fc9280b6ff8a601844beeabb6c1ce92082210..bf4f7d33e3c2077d1dd03d33a1ed389ef6217633 100644 --- a/transcoder_all/layer_37_width_262k_l0_small/config.json +++ b/transcoder_all/layer_37_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_16k_l0_big_affine/config.json b/transcoder_all/layer_38_width_16k_l0_big_affine/config.json index 75ac74505a4e34e4f16ee23312f47deea7ff7c70..520eaa9e457f8e8d639fe4939ff56f31acdd0ab9 100644 --- a/transcoder_all/layer_38_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_38_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_262k_l0_small/config.json b/transcoder_all/layer_38_width_262k_l0_small/config.json index 155ac8ca6edadaeb00e63d2ac9c2944ac77fc0a5..5aff82afa77164db6b4da3084dcdb8144f11a9af 100644 --- a/transcoder_all/layer_38_width_262k_l0_small/config.json +++ b/transcoder_all/layer_38_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_16k_l0_small_affine/config.json b/transcoder_all/layer_39_width_16k_l0_small_affine/config.json index c0249aedf527a182cac7d619930ecdb7e4f93926..93e874ebe32bb8032a827cf4d5c9bc6ae5e5218a 100644 --- a/transcoder_all/layer_39_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_39_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_big_affine/config.json b/transcoder_all/layer_3_width_262k_l0_big_affine/config.json index 965a20eaa1b20212b7a31aeb08f29e0ea3b0182a..a923e2211bdf9a86ba375db32da5e3601cf36d54 100644 --- a/transcoder_all/layer_3_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_3_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 68, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_small/config.json b/transcoder_all/layer_3_width_262k_l0_small/config.json index 18e11748f0ccef83bda28684787a08a9fc833724..068486e3e91d9ea7bedf98abd86cfd5df7dce196 100644 --- a/transcoder_all/layer_3_width_262k_l0_small/config.json +++ b/transcoder_all/layer_3_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_42_width_262k_l0_big_affine/config.json b/transcoder_all/layer_42_width_262k_l0_big_affine/config.json index cd65cee712cefc12c63f70bb245cf4072aff3123..7233cd4ff90425fd0ea82570a2a7a79e99ce10a7 100644 --- a/transcoder_all/layer_42_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_42_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.42.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_44_width_16k_l0_big/config.json b/transcoder_all/layer_44_width_16k_l0_big/config.json index c0d24abcb91a931eb04c58a451b0e6796de5ff75..825511742f2a081db2922909e9dc3be8c3e7888e 100644 --- a/transcoder_all/layer_44_width_16k_l0_big/config.json +++ b/transcoder_all/layer_44_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.44.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_45_width_16k_l0_small_affine/config.json b/transcoder_all/layer_45_width_16k_l0_small_affine/config.json index f59a1902485e763251ee05ded24cc6f5ef28d065..521d22bb95075111c62777581337ade852b5dc57 100644 --- a/transcoder_all/layer_45_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_45_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.45.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_45_width_262k_l0_big/config.json b/transcoder_all/layer_45_width_262k_l0_big/config.json index d3e61551f1f38b12d169f070b0070fb8e8968258..6c1634f132a411c56d28b4b88336dc88a88fd7bd 100644 --- a/transcoder_all/layer_45_width_262k_l0_big/config.json +++ b/transcoder_all/layer_45_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.45.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_45_width_262k_l0_small/config.json b/transcoder_all/layer_45_width_262k_l0_small/config.json index 432892b3acd0971007db59d140f32e435b22a315..160cdb54377b83732d7faf254396d90b042d7648 100644 --- a/transcoder_all/layer_45_width_262k_l0_small/config.json +++ b/transcoder_all/layer_45_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.45.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_45_width_262k_l0_small_affine/config.json b/transcoder_all/layer_45_width_262k_l0_small_affine/config.json index 95ae350c8d7b4307d65a506d62c2e99f6e6e6b9d..22aa5e924fe22f943897b3d1af31461e4c008642 100644 --- a/transcoder_all/layer_45_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_45_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.45.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_16k_l0_big_affine/config.json b/transcoder_all/layer_48_width_16k_l0_big_affine/config.json index d66b304052cd122aa27ac29ae44579c39d9a9656..5ecd757994a1ea03fc443b2b41f9d95d515717ba 100644 --- a/transcoder_all/layer_48_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_48_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_16k_l0_big/config.json b/transcoder_all/layer_50_width_16k_l0_big/config.json index 6553e6fbeec35b22a62682a417391e386760b178..fca3ccd0ba7ea1eeb41087b90e673d6e49e6162a 100644 --- a/transcoder_all/layer_50_width_16k_l0_big/config.json +++ b/transcoder_all/layer_50_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_51_width_16k_l0_big/config.json b/transcoder_all/layer_51_width_16k_l0_big/config.json index adbfda7287c9188819a192322139f4db20ef1c7f..89caf2e81a52a672369bce7aa05901ab6082d87d 100644 --- a/transcoder_all/layer_51_width_16k_l0_big/config.json +++ b/transcoder_all/layer_51_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.51.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.51.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_16k_l0_big/config.json b/transcoder_all/layer_53_width_16k_l0_big/config.json index 7bc5d8c02e68a5258e4a5604fd2c4bc289ca1b34..9b66832859e5e1c5908a5491c00be0899fc3860f 100644 --- a/transcoder_all/layer_53_width_16k_l0_big/config.json +++ b/transcoder_all/layer_53_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_262k_l0_big/config.json b/transcoder_all/layer_53_width_262k_l0_big/config.json index 58a5fd8d41e441aaa7072987884e130859309b8e..7e172deaf19858726c0b21f926c96498994a1a04 100644 --- a/transcoder_all/layer_53_width_262k_l0_big/config.json +++ b/transcoder_all/layer_53_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_54_width_16k_l0_big/config.json b/transcoder_all/layer_54_width_16k_l0_big/config.json index 674a279894edba15d78d7722cda862b930eb5268..6d7b97c121cfb27aa8bc747e8f683d07ea436e7f 100644 --- a/transcoder_all/layer_54_width_16k_l0_big/config.json +++ b/transcoder_all/layer_54_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.54.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_54_width_16k_l0_small_affine/config.json b/transcoder_all/layer_54_width_16k_l0_small_affine/config.json index a8b35247745429a8f59f7dcd5d260afebd7ac56b..ab4f80110594d24745b0a5219ae5bbb5506eec3d 100644 --- a/transcoder_all/layer_54_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_54_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.54.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_262k_l0_big_affine/config.json b/transcoder_all/layer_56_width_262k_l0_big_affine/config.json index 8eea656736dbb70804a4e42e47e62e9c9091b8c7..14f92679ee18ffa0e757f529001e89bc03e57897 100644 --- a/transcoder_all/layer_56_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_56_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_262k_l0_small/config.json b/transcoder_all/layer_57_width_262k_l0_small/config.json index 002954b92d845eb853f19af370a71189a66a1e54..c4f3dae2c1fddfa0111884e0d17252ad33cbbac6 100644 --- a/transcoder_all/layer_57_width_262k_l0_small/config.json +++ b/transcoder_all/layer_57_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_58_width_16k_l0_small/config.json b/transcoder_all/layer_58_width_16k_l0_small/config.json index b670fcad87fe8ee874cbd6f1cb54eafe2947cb75..b0fbee3482853b8608b4659b92a0916eec731c83 100644 --- a/transcoder_all/layer_58_width_16k_l0_small/config.json +++ b/transcoder_all/layer_58_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.58.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_58_width_16k_l0_small_affine/config.json b/transcoder_all/layer_58_width_16k_l0_small_affine/config.json index df52ce7e048d254f736f48211cad08104f5dcaec..ad9a343ebe76f8948b64bf5aabaf6b5273dcb988 100644 --- a/transcoder_all/layer_58_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_58_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.58.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_58_width_262k_l0_big/config.json b/transcoder_all/layer_58_width_262k_l0_big/config.json index 51b5a50d76c73a9a0c345ba572f0f82861ed5a99..89083c23ea28e8b25411974f4b360765f0e33162 100644 --- a/transcoder_all/layer_58_width_262k_l0_big/config.json +++ b/transcoder_all/layer_58_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.58.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_59_width_16k_l0_small/config.json b/transcoder_all/layer_59_width_16k_l0_small/config.json index 59d470c8a10dbc17acc41a8873a6947fb1789124..8b078420359f3e2d5030106afa0410995bc71629 100644 --- a/transcoder_all/layer_59_width_16k_l0_small/config.json +++ b/transcoder_all/layer_59_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.59.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.59.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_60_width_262k_l0_small/config.json b/transcoder_all/layer_60_width_262k_l0_small/config.json index da90b66e08c95b8ef9bec823657b83d35568cbdb..33d4b2835563fa81c3e4e3181745f823e88fe090 100644 --- a/transcoder_all/layer_60_width_262k_l0_small/config.json +++ b/transcoder_all/layer_60_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.60.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_61_width_16k_l0_big/config.json b/transcoder_all/layer_61_width_16k_l0_big/config.json index 7ead37cda063462a77e1c10c73f8078718f5a195..1142e067c3653c5173b920477dee57f22390e259 100644 --- a/transcoder_all/layer_61_width_16k_l0_big/config.json +++ b/transcoder_all/layer_61_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.61.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_small/config.json b/transcoder_all/layer_8_width_16k_l0_small/config.json index a9e23dd965add17a9e54380c8cf67229a759167f..b67338c3426c5177144af8f2f19da7b1a218a2bf 100644 --- a/transcoder_all/layer_8_width_16k_l0_small/config.json +++ b/transcoder_all/layer_8_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_small_affine/config.json b/transcoder_all/layer_8_width_16k_l0_small_affine/config.json index 7d03c090691897cb2f37ee56f6c22934c9b01bdd..12df91f782969cd412087e2e9c52c81497ad43ca 100644 --- a/transcoder_all/layer_8_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_8_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file