diff --git a/transcoder_all/layer_0_width_16k_l0_big_affine/config.json b/transcoder_all/layer_0_width_16k_l0_big_affine/config.json index 0205b55428ee5195760eb43fa874e65f08aea5ce..0e736610beffeefd45250cfbd2a441cb1fb0db71 100644 --- a/transcoder_all/layer_0_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_0_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_big/config.json b/transcoder_all/layer_0_width_262k_l0_big/config.json index c114078e2640aa0092c37437ac3358107a98b3f0..a6cbbb6acf536e86a4db649d4bb8157417242cde 100644 --- a/transcoder_all/layer_0_width_262k_l0_big/config.json +++ b/transcoder_all/layer_0_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_big_affine/config.json b/transcoder_all/layer_0_width_262k_l0_big_affine/config.json index 271aea24d305238732a834ab8a37e43cc6130510..0976f92c4efc1653e992bc2bd2cc0790b83f0dfc 100644 --- a/transcoder_all/layer_0_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_0_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_small/config.json b/transcoder_all/layer_0_width_262k_l0_small/config.json index ae12160816ee17994c5849c0b228778d0cdd86bd..6edb05c9ce537819db556b53a9dc38ec00820286 100644 --- a/transcoder_all/layer_0_width_262k_l0_small/config.json +++ b/transcoder_all/layer_0_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_small_affine/config.json b/transcoder_all/layer_10_width_262k_l0_small_affine/config.json index b0729fcafb4126c3cecf2d52fc10ac38200a87b5..e5f78e739a59174fca3dbe06042e4a6e8dcd688f 100644 --- a/transcoder_all/layer_10_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_10_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 14, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_big/config.json b/transcoder_all/layer_13_width_16k_l0_big/config.json index eb2c3e7ee4109d42f59724f5bdf15520e829d95b..3d1b1258a753c397cf29ebbebcef72fed1ae57de 100644 --- a/transcoder_all/layer_13_width_16k_l0_big/config.json +++ b/transcoder_all/layer_13_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 97, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_small_affine/config.json b/transcoder_all/layer_13_width_16k_l0_small_affine/config.json index b232c9167130840cb406205f7751e12f6252d3e4..70f028085c7393e2efad04cc9196cd03a1212019 100644 --- a/transcoder_all/layer_13_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_13_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_big/config.json b/transcoder_all/layer_14_width_16k_l0_big/config.json index 7666fe00aa2a0e2c260493a8be6a885b6c207028..fd1ffa1d5a8bbb905b573da343d2db0135ae2352 100644 --- a/transcoder_all/layer_14_width_16k_l0_big/config.json +++ b/transcoder_all/layer_14_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 100, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_big/config.json b/transcoder_all/layer_14_width_262k_l0_big/config.json index cd8804727f1004932c952468fdc2a2e936114a15..a06620c9f6b3732767097fea5bfa3e1de7cb1d95 100644 --- a/transcoder_all/layer_14_width_262k_l0_big/config.json +++ b/transcoder_all/layer_14_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 100, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_small/config.json b/transcoder_all/layer_16_width_16k_l0_small/config.json index 75011f9f83ead85894d4db299bc3777140f9fd62..bbfb48d275f75c73a7d6e4ddbd68eaaa3dcb91e4 100644 --- a/transcoder_all/layer_16_width_16k_l0_small/config.json +++ b/transcoder_all/layer_16_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 17, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_small_affine/config.json b/transcoder_all/layer_16_width_16k_l0_small_affine/config.json index 672b7ced64071c089385f9aadf56ce2ab9f79bcf..c51441100d2c62d20f43f89d0cfbcd6f2274f676 100644 --- a/transcoder_all/layer_16_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_16_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 17, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_big/config.json b/transcoder_all/layer_16_width_262k_l0_big/config.json index 0d329a728035aeda921a8920c67429dbd8739ab4..97ed3e7b4c7705a3bf3c04d5de4dc943e38f7b5f 100644 --- a/transcoder_all/layer_16_width_262k_l0_big/config.json +++ b/transcoder_all/layer_16_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 106, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_big/config.json b/transcoder_all/layer_17_width_16k_l0_big/config.json index b38462f43fded9bf35b00b0ff57fe4ea94a7232c..544d6f549e6b691296a50bd758df2ae5657ee098 100644 --- a/transcoder_all/layer_17_width_16k_l0_big/config.json +++ b/transcoder_all/layer_17_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 109, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_small_affine/config.json b/transcoder_all/layer_17_width_16k_l0_small_affine/config.json index 905b824bf2c125f3d6377e96ac1e6c8801108057..6274a76948e24c065ee310bb5a169ab153104c27 100644 --- a/transcoder_all/layer_17_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_17_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_big_affine/config.json b/transcoder_all/layer_17_width_262k_l0_big_affine/config.json index cb462c520f7fd2ae668c6d2daa72c12075a794c6..0b499afec3a040c43d37446d41d16229f373dc55 100644 --- a/transcoder_all/layer_17_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_17_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 109, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small_affine/config.json b/transcoder_all/layer_17_width_262k_l0_small_affine/config.json index fe4a2725e0fb7a14e28af314c4b1343f2f635849..de8ed7991128371f17e2cb6536048edc29e45608 100644 --- a/transcoder_all/layer_17_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_17_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_big_affine/config.json b/transcoder_all/layer_18_width_16k_l0_big_affine/config.json index dfe489ef498fa49dba3c4d2cb36542980f827381..3aff5e8be17289ffe013d720cdc5f178069aa2b5 100644 --- a/transcoder_all/layer_18_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_18_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 112, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_small/config.json b/transcoder_all/layer_19_width_16k_l0_small/config.json index a94dd113f4c8fd7d95550228971e931d0730e66a..6e028ec67bab3daab2474bb509cc7e9d6dbc1a74 100644 --- a/transcoder_all/layer_19_width_16k_l0_small/config.json +++ b/transcoder_all/layer_19_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 19, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_small/config.json b/transcoder_all/layer_20_width_16k_l0_small/config.json index fef455d0c69cc3c62176d5bbd10786dad4a31d1f..4e6af7a166d67c894d58c864e59c31774b2498c5 100644 --- a/transcoder_all/layer_20_width_16k_l0_small/config.json +++ b/transcoder_all/layer_20_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 19, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_small_affine/config.json b/transcoder_all/layer_20_width_16k_l0_small_affine/config.json index d25259c062b80176d0b3a23825c072b07252703a..626f0d714809fb43e9089959a0aeb88d7e7bbac0 100644 --- a/transcoder_all/layer_20_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_20_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 19, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_21_width_16k_l0_big_affine/config.json b/transcoder_all/layer_21_width_16k_l0_big_affine/config.json index 63ee04d2682cba757c809d3a2c0c1d6bb682ac5d..21af3b5707b5d55bc16883baa85e28b0b610b8eb 100644 --- a/transcoder_all/layer_21_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_21_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_21_width_16k_l0_small_affine/config.json b/transcoder_all/layer_21_width_16k_l0_small_affine/config.json index 64c347d2df78e203c8fa16d40bf96338d630c2f5..4e34bab7d704b5fbe4d6f85f220b16be68140233 100644 --- a/transcoder_all/layer_21_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_21_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_21_width_262k_l0_small_affine/config.json b/transcoder_all/layer_21_width_262k_l0_small_affine/config.json index f752f50f345a33e360efad45850deea4fdbd7c70..d7650cdeb1dfcc8bb8b601bc5cd625a52990d761 100644 --- a/transcoder_all/layer_21_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_21_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_big/config.json b/transcoder_all/layer_22_width_262k_l0_big/config.json index 645310c5c01a2123ccf75e1f4f8258075143fcfe..139bbaef1ba12fc2d2181c3a2685af78b339f391 100644 --- a/transcoder_all/layer_22_width_262k_l0_big/config.json +++ b/transcoder_all/layer_22_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_small/config.json b/transcoder_all/layer_23_width_16k_l0_small/config.json index 0cfbda05136b65ced73e3fa90e1d5b4b79f670a0..efd39eb074dc106ec636fde4dd6a34ad67215531 100644 --- a/transcoder_all/layer_23_width_16k_l0_small/config.json +++ b/transcoder_all/layer_23_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_big/config.json b/transcoder_all/layer_24_width_16k_l0_big/config.json index 70cba2e22f20b5d53057978dbcb274a28b4b2881..fc39efe5aba2db8246c673216efec3bdd3bf0775 100644 --- a/transcoder_all/layer_24_width_16k_l0_big/config.json +++ b/transcoder_all/layer_24_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_big_affine/config.json b/transcoder_all/layer_24_width_16k_l0_big_affine/config.json index b5fb08d5dc3036a182690424b0b932d831fbe2b7..6bda68213edfb9fe2216874e36527eb171f5baf7 100644 --- a/transcoder_all/layer_24_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_24_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_16k_l0_small/config.json b/transcoder_all/layer_24_width_16k_l0_small/config.json index 065c97a3cc37f60ea5cd96a964708471eec60b47..f1c3bef4bbf606623251b71bbca088f0a90471a8 100644 --- a/transcoder_all/layer_24_width_16k_l0_small/config.json +++ b/transcoder_all/layer_24_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_big/config.json b/transcoder_all/layer_24_width_262k_l0_big/config.json index 536be5bfc3ced231d4178737879ed49a704c3a44..5c388d019365747c483cb856619d05f0a9b843d2 100644 --- a/transcoder_all/layer_24_width_262k_l0_big/config.json +++ b/transcoder_all/layer_24_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_small_affine/config.json b/transcoder_all/layer_25_width_16k_l0_small_affine/config.json index e59854f167d85f3f170331f2aff6679e961204be..cdeb1e2b474ffdd36495fc9763aed90d7bed4a83 100644 --- a/transcoder_all/layer_25_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_25_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_big/config.json b/transcoder_all/layer_25_width_262k_l0_big/config.json index 93064417deb3405a05a019d730a1521339c04540..be16ccf8b991407beaa8be0901dfe84f0bfc8f8e 100644 --- a/transcoder_all/layer_25_width_262k_l0_big/config.json +++ b/transcoder_all/layer_25_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_small/config.json b/transcoder_all/layer_25_width_262k_l0_small/config.json index 70b85b613a4d155f2c14627e4ddcced719c38a11..272007160fa289b92a9cae271d837819fb18590a 100644 --- a/transcoder_all/layer_25_width_262k_l0_small/config.json +++ b/transcoder_all/layer_25_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_16k_l0_small_affine/config.json b/transcoder_all/layer_26_width_16k_l0_small_affine/config.json index d665737196ade85c11782a1f281a7db7e163cb76..97b60efd44c551cd78a060a3904ae93dadab89ae 100644 --- a/transcoder_all/layer_26_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_26_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_262k_l0_big/config.json b/transcoder_all/layer_26_width_262k_l0_big/config.json index 0928180f597165f331097cf4f3b064aa62eeb1d2..200917dd22b61163bb0c3751be61c6031a1f3ee3 100644 --- a/transcoder_all/layer_26_width_262k_l0_big/config.json +++ b/transcoder_all/layer_26_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_16k_l0_big_affine/config.json b/transcoder_all/layer_27_width_16k_l0_big_affine/config.json index 16693767f0b93d4b51517ff0f749afc2265a35f5..08995265f3a817ef5c5a616dffb1b40b97d65ced 100644 --- a/transcoder_all/layer_27_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_27_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_28_width_16k_l0_big/config.json b/transcoder_all/layer_28_width_16k_l0_big/config.json index 0f319d78ce990f3d4871f222348d6f9a1b4630db..0bbed730b61b26b55871f9dc0a261b7bcbd8d7e9 100644 --- a/transcoder_all/layer_28_width_16k_l0_big/config.json +++ b/transcoder_all/layer_28_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_16k_l0_small_affine/config.json b/transcoder_all/layer_29_width_16k_l0_small_affine/config.json index 26f7a1646c01952fd97ca415c3bfe71eb6937650..90738082d638d986e03aeeeeb6aa9c9d45abbc43 100644 --- a/transcoder_all/layer_29_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_29_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_16k_l0_big_affine/config.json b/transcoder_all/layer_30_width_16k_l0_big_affine/config.json index cd738603c3a5af7ee83f3b7f9677b99141d7f397..0357c95dbdc7e9a37580be4540f1e32fa07c8294 100644 --- a/transcoder_all/layer_30_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_30_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_16k_l0_small/config.json b/transcoder_all/layer_30_width_16k_l0_small/config.json index 864ad2120bc1258f0b4deaf4175368002d877d3f..5e7dec6d4b6a0f0c6ea8051f180daad49a2abf57 100644 --- a/transcoder_all/layer_30_width_16k_l0_small/config.json +++ b/transcoder_all/layer_30_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_262k_l0_big/config.json b/transcoder_all/layer_30_width_262k_l0_big/config.json index 8fc93fe93ce38d46e3c2e30ce07c7c905ef892ad..eaefb5f31cdd0f26f1f73f0b6310f6326839e9d7 100644 --- a/transcoder_all/layer_30_width_262k_l0_big/config.json +++ b/transcoder_all/layer_30_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_262k_l0_big_affine/config.json b/transcoder_all/layer_30_width_262k_l0_big_affine/config.json index 3037920d138a84208986dfada90bfe424ad20386..abad944b715aab58d4f6dee918e6474f8f18ef18 100644 --- a/transcoder_all/layer_30_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_30_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_32_width_16k_l0_big/config.json b/transcoder_all/layer_32_width_16k_l0_big/config.json index 3ad2f9ca43b584fc77856b6424d6f812dcb8e3c6..3db554f2348ab8465a61243564d08ad70f07c727 100644 --- a/transcoder_all/layer_32_width_16k_l0_big/config.json +++ b/transcoder_all/layer_32_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_32_width_262k_l0_big_affine/config.json b/transcoder_all/layer_32_width_262k_l0_big_affine/config.json index eb9d3945b77464e9239f7aebc916c1cc3615424e..1393bd489378d2ba0b49fc15e371316dd9850b7a 100644 --- a/transcoder_all/layer_32_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_32_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_262k_l0_big/config.json b/transcoder_all/layer_33_width_262k_l0_big/config.json index 4d4f56082e846c9b1f6b51e4708861c66e5243aa..f32dbf08f40cf8fa9413357a9b842531cd36bba0 100644 --- a/transcoder_all/layer_33_width_262k_l0_big/config.json +++ b/transcoder_all/layer_33_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_16k_l0_small/config.json b/transcoder_all/layer_34_width_16k_l0_small/config.json index 09270b5635547fa1c4d6556fe13ca9228e43652d..4bc053de27b3d1d6e462d5cbdacd4e5b0e67d339 100644 --- a/transcoder_all/layer_34_width_16k_l0_small/config.json +++ b/transcoder_all/layer_34_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_262k_l0_big/config.json b/transcoder_all/layer_34_width_262k_l0_big/config.json index 599a970976ca60226ce67ad01e27215158df0f81..e9daeabca0e14648afa1eda1f87195a14c649058 100644 --- a/transcoder_all/layer_34_width_262k_l0_big/config.json +++ b/transcoder_all/layer_34_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_262k_l0_big_affine/config.json b/transcoder_all/layer_34_width_262k_l0_big_affine/config.json index b87807874b53e22a4ef54b4643674f466e02a64f..e8e5d48da88d09a33fef1692d3d76b011f8680ac 100644 --- a/transcoder_all/layer_34_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_34_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_16k_l0_big_affine/config.json b/transcoder_all/layer_35_width_16k_l0_big_affine/config.json index 154e8a7265b0574892638b5ae34721b0a9f150b3..ad0f4c0c9ee6bf30b2cb61a2cf3df7630f8340f3 100644 --- a/transcoder_all/layer_35_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_35_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_16k_l0_small_affine/config.json b/transcoder_all/layer_35_width_16k_l0_small_affine/config.json index 3ae83b96e8cfe41ef2c02ef20480080ea1c09372..8d585735c304b5201eb305f92c4246d709ddbeb4 100644 --- a/transcoder_all/layer_35_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_35_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_262k_l0_big_affine/config.json b/transcoder_all/layer_35_width_262k_l0_big_affine/config.json index 47eb16fd7963e99812e09392a79529325e0bb23d..a8ceddaa86b4dcd5ee198d491693f948f9688362 100644 --- a/transcoder_all/layer_35_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_35_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_36_width_16k_l0_big/config.json b/transcoder_all/layer_36_width_16k_l0_big/config.json index c538d44d1ef62bf8ca8bf9a63d69b74f604e5253..29b2e847c69b8f0bb168ecacb7f9987e4ad5eb74 100644 --- a/transcoder_all/layer_36_width_16k_l0_big/config.json +++ b/transcoder_all/layer_36_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.36.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_36_width_262k_l0_big_affine/config.json b/transcoder_all/layer_36_width_262k_l0_big_affine/config.json index 57e8b157baa475fae485f814249b6abf200d2e80..72698ed1c219745c1977a56e96f453fb433456a9 100644 --- a/transcoder_all/layer_36_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_36_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.36.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_262k_l0_big/config.json b/transcoder_all/layer_37_width_262k_l0_big/config.json index af5c148d189a12306a2b6dfd486f719a56048289..9f41902efb46ec5e382e2c732be8451b42ec2f08 100644 --- a/transcoder_all/layer_37_width_262k_l0_big/config.json +++ b/transcoder_all/layer_37_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_262k_l0_big/config.json b/transcoder_all/layer_39_width_262k_l0_big/config.json index ba1339f76ac2550e5fec89c184822e7e2b936f0e..0d84baa613ee4d748488a1de15e304f6d6cd00be 100644 --- a/transcoder_all/layer_39_width_262k_l0_big/config.json +++ b/transcoder_all/layer_39_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_262k_l0_small/config.json b/transcoder_all/layer_39_width_262k_l0_small/config.json index a496c4fb6698192313163bf794726e939bb1b20d..2ab0e5e957964e0af557c0213fe21d6ad9014462 100644 --- a/transcoder_all/layer_39_width_262k_l0_small/config.json +++ b/transcoder_all/layer_39_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_262k_l0_small_affine/config.json b/transcoder_all/layer_39_width_262k_l0_small_affine/config.json index a0b0cc3a8a864a3afc06d548db8e4a019f36a30d..3d6d024afd606a145b3b706b790185fca70c4df8 100644 --- a/transcoder_all/layer_39_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_39_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_small_affine/config.json b/transcoder_all/layer_3_width_262k_l0_small_affine/config.json index 40e679abf43309e5219369838d09246b54d997b9..2bc9f779f485ae52d260d86d771de954fd3c5692 100644 --- a/transcoder_all/layer_3_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_3_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_40_width_262k_l0_big_affine/config.json b/transcoder_all/layer_40_width_262k_l0_big_affine/config.json index bfeff55fefd287161502db805b7b9fd92b198a24..cd15f6efa435e6a564b4ecc83164127799e7c8d4 100644 --- a/transcoder_all/layer_40_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_40_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.40.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_42_width_16k_l0_small_affine/config.json b/transcoder_all/layer_42_width_16k_l0_small_affine/config.json index d016284fb6219785780cfbdbd972865c0c211845..5613477059211a887d7cab82e9d5033d7c2b1243 100644 --- a/transcoder_all/layer_42_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_42_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.42.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_44_width_262k_l0_big/config.json b/transcoder_all/layer_44_width_262k_l0_big/config.json index 6c371e7906669ccb60130792e059b9250c02b963..c3ccc83134b14f2ab32fe6b24f4f77c66ee24bba 100644 --- a/transcoder_all/layer_44_width_262k_l0_big/config.json +++ b/transcoder_all/layer_44_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.44.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_44_width_262k_l0_small/config.json b/transcoder_all/layer_44_width_262k_l0_small/config.json index 1aba03229854aa624d1d5acbebf16f135ea0fbc5..64ed4d87e8b3e2ebae6d46bcd18a0b01571b4305 100644 --- a/transcoder_all/layer_44_width_262k_l0_small/config.json +++ b/transcoder_all/layer_44_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.44.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_44_width_262k_l0_small_affine/config.json b/transcoder_all/layer_44_width_262k_l0_small_affine/config.json index 90ea6f2f6512f30c74597965358962d689e90981..5d2136a6b958e4a714864fe29fc06b924d467c29 100644 --- a/transcoder_all/layer_44_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_44_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.44.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_46_width_262k_l0_big_affine/config.json b/transcoder_all/layer_46_width_262k_l0_big_affine/config.json index a8e3695570afd20208ca14df8b9e7c8502c84b51..c055c78131d61904c44cba6f581b234008211efe 100644 --- a/transcoder_all/layer_46_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_46_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.46.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.46.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_16k_l0_big_affine/config.json b/transcoder_all/layer_47_width_16k_l0_big_affine/config.json index 615da02f9e08ef1dc4e0b7f788a18a68e2504292..89d7af3495c88294f7317d44116bb84e1607a0a3 100644 --- a/transcoder_all/layer_47_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_47_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_262k_l0_big/config.json b/transcoder_all/layer_47_width_262k_l0_big/config.json index f7e565ad3aaccc1bad887074374c228ab014e754..05b41ddcf9472326768f12a53821d8feb4979f01 100644 --- a/transcoder_all/layer_47_width_262k_l0_big/config.json +++ b/transcoder_all/layer_47_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_262k_l0_big_affine/config.json b/transcoder_all/layer_47_width_262k_l0_big_affine/config.json index 54a1126761b66f295258612e101bd4cce75b18ae..40523ea00a3a882991c0d9a3cde66f7274722966 100644 --- a/transcoder_all/layer_47_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_47_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_262k_l0_small/config.json b/transcoder_all/layer_47_width_262k_l0_small/config.json index 6d20cab088535b1ea1bc2961493804d17edc78ef..1f0c1d8ba02d3ee81fe81225c2262523edf2bccd 100644 --- a/transcoder_all/layer_47_width_262k_l0_small/config.json +++ b/transcoder_all/layer_47_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_16k_l0_big/config.json b/transcoder_all/layer_48_width_16k_l0_big/config.json index 67f323a1c3bc1c6c2f34fb7b064e04d21bb73cb9..41750e97d014f5cfa3f3fc1391f82c0e4985e882 100644 --- a/transcoder_all/layer_48_width_16k_l0_big/config.json +++ b/transcoder_all/layer_48_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_262k_l0_big/config.json b/transcoder_all/layer_48_width_262k_l0_big/config.json index d296bee8f361974bfd7a20562a0ad4dd8608595c..b2439929afe2256b86ae2589482e804514c8981d 100644 --- a/transcoder_all/layer_48_width_262k_l0_big/config.json +++ b/transcoder_all/layer_48_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_small/config.json b/transcoder_all/layer_4_width_262k_l0_small/config.json index 136ad7128fd96cff8c8fcb1db4d3aa612d46e779..bed58349b9c819a0267f38aa77a32c2e816bac0b 100644 --- a/transcoder_all/layer_4_width_262k_l0_small/config.json +++ b/transcoder_all/layer_4_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_small_affine/config.json b/transcoder_all/layer_4_width_262k_l0_small_affine/config.json index 186ddb3052a9021eef0e0a93b8a9fb182d551559..8e98d1ae66b174ac654d32f0b241b34018b8b09a 100644 --- a/transcoder_all/layer_4_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_4_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_16k_l0_big_affine/config.json b/transcoder_all/layer_50_width_16k_l0_big_affine/config.json index 8b42bc0e5a1215b40c109f18d8dccf8f7571c540..17a06c15e35a33cbcde62fcb585bcaedfb50362a 100644 --- a/transcoder_all/layer_50_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_50_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_262k_l0_big/config.json b/transcoder_all/layer_50_width_262k_l0_big/config.json index 7b01089785c28a13edd3279120df1723572d641b..3b50fdc45fde7d475fa1f5661d480a9140788fe2 100644 --- a/transcoder_all/layer_50_width_262k_l0_big/config.json +++ b/transcoder_all/layer_50_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_51_width_16k_l0_big_affine/config.json b/transcoder_all/layer_51_width_16k_l0_big_affine/config.json index 5f8d99fda3fef227bc61a80c42be57c9fbe3dd35..59200a112f53ce6066c597440d1fddf1a8cbe924 100644 --- a/transcoder_all/layer_51_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_51_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.51.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.51.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_262k_l0_big_affine/config.json b/transcoder_all/layer_52_width_262k_l0_big_affine/config.json index b05c84040ba36e12103bb5eee6b79a5501c08256..812f8d52445eeeb8be1fa828d9629e5b5fbd4cc1 100644 --- a/transcoder_all/layer_52_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_52_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_262k_l0_small_affine/config.json b/transcoder_all/layer_52_width_262k_l0_small_affine/config.json index fbbbc7038fa1d89a4410cc740d8886f3ab0352cb..a35ea51ae50b81ac7dbc71ed85cf6a5b03a17cfd 100644 --- a/transcoder_all/layer_52_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_52_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_262k_l0_big_affine/config.json b/transcoder_all/layer_53_width_262k_l0_big_affine/config.json index fa48f4b8b452a03d7eef9937968efd1e5a771ff3..7c7ce3caa818fab1e36eb5a84c0a21b6a4a8b42f 100644 --- a/transcoder_all/layer_53_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_53_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_262k_l0_small/config.json b/transcoder_all/layer_53_width_262k_l0_small/config.json index 64c98f54c9ca490a7d4da6de57b4f5e38efbec98..cdeece1a6932ef8796e726bf23dfd182ad2af7c4 100644 --- a/transcoder_all/layer_53_width_262k_l0_small/config.json +++ b/transcoder_all/layer_53_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_54_width_16k_l0_big_affine/config.json b/transcoder_all/layer_54_width_16k_l0_big_affine/config.json index b8f1c1f8a38435ee73089ec2ae6ab1a5bc552a39..3a9bfdeab587ee1a78e2b5f055bfdd9d3fb99a87 100644 --- a/transcoder_all/layer_54_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_54_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.54.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_54_width_16k_l0_small/config.json b/transcoder_all/layer_54_width_16k_l0_small/config.json index cca67e0ca523c19be3f72aa05552ae20b3bc603b..cf526c58b2fc9e73f3d019ed638e651d709a3116 100644 --- a/transcoder_all/layer_54_width_16k_l0_small/config.json +++ b/transcoder_all/layer_54_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.54.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_262k_l0_big/config.json b/transcoder_all/layer_55_width_262k_l0_big/config.json index 31df2140699fe7a6f9f573e0197524049d82bd71..52df8ede7a9e219e15774e37db78d2e15c239286 100644 --- a/transcoder_all/layer_55_width_262k_l0_big/config.json +++ b/transcoder_all/layer_55_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_262k_l0_small/config.json b/transcoder_all/layer_55_width_262k_l0_small/config.json index 0bddae85ca6e127a33352f880c6cf8ee660d0cd0..c7a52ec7777948965a21fa528e866fad4277a6eb 100644 --- a/transcoder_all/layer_55_width_262k_l0_small/config.json +++ b/transcoder_all/layer_55_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_262k_l0_small_affine/config.json b/transcoder_all/layer_55_width_262k_l0_small_affine/config.json index b708d691da9b17b4e0c499ca9c748bd9da554e46..7f00d9f340fa35e3b481c416c5db16ef9169cd10 100644 --- a/transcoder_all/layer_55_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_55_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_262k_l0_big/config.json b/transcoder_all/layer_56_width_262k_l0_big/config.json index af592f425d9261eed005c4b413ca67d3adff392b..cefe4ff238828c263368d6d21ae73c15e486701d 100644 --- a/transcoder_all/layer_56_width_262k_l0_big/config.json +++ b/transcoder_all/layer_56_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_262k_l0_small_affine/config.json b/transcoder_all/layer_57_width_262k_l0_small_affine/config.json index 7e2fa8906663b6c53e4b701e75fde60be81927e1..e3d439baf7f5a0aad41208d2f33a80755c82c648 100644 --- a/transcoder_all/layer_57_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_57_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_59_width_16k_l0_big/config.json b/transcoder_all/layer_59_width_16k_l0_big/config.json index f60c1fc80158d91d6bd1c204748db166448bace4..38197a744d58c1a2a6c83db94029721750b96c83 100644 --- a/transcoder_all/layer_59_width_16k_l0_big/config.json +++ b/transcoder_all/layer_59_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.59.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.59.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_big/config.json b/transcoder_all/layer_5_width_16k_l0_big/config.json index 70444808fc77cfb25613e5b3692f19f26b103f24..77cb103d12b1250e17533db90dec69c380b2e82f 100644 --- a/transcoder_all/layer_5_width_16k_l0_big/config.json +++ b/transcoder_all/layer_5_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 74, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_small/config.json b/transcoder_all/layer_5_width_262k_l0_small/config.json index 4be3e8c3ba2da665ff73d7362dfd59ad73ee4a6e..5e2ea705ec23856f2cb218975452f2b8bda58b64 100644 --- a/transcoder_all/layer_5_width_262k_l0_small/config.json +++ b/transcoder_all/layer_5_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 12, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_60_width_16k_l0_big/config.json b/transcoder_all/layer_60_width_16k_l0_big/config.json index 223779aa31fc50bf1d6a12b456c1a916f796ea36..6e7c6b53599fb34c830aabfc8e8078bc1d6e71dd 100644 --- a/transcoder_all/layer_60_width_16k_l0_big/config.json +++ b/transcoder_all/layer_60_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.60.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_60_width_262k_l0_big_affine/config.json b/transcoder_all/layer_60_width_262k_l0_big_affine/config.json index 25e97095c8bbe8651fb5d054467585af84ad7fb6..88bf0182995c3cf16f5fcb0c5d47681ab57466cc 100644 --- a/transcoder_all/layer_60_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_60_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.60.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_61_width_16k_l0_small/config.json b/transcoder_all/layer_61_width_16k_l0_small/config.json index 2c33d1768cfc9534db927c263814fc6e62e44308..fba7391c62d14c01c7bedf5e15eda3ae91c8dacf 100644 --- a/transcoder_all/layer_61_width_16k_l0_small/config.json +++ b/transcoder_all/layer_61_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.61.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_big/config.json b/transcoder_all/layer_6_width_262k_l0_big/config.json index 68e256fbc2faed70802aca3858e187eba53e7214..c07bef3812ffa0b7d93d8f0d3a19d4b0a4070143 100644 --- a/transcoder_all/layer_6_width_262k_l0_big/config.json +++ b/transcoder_all/layer_6_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 77, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_small/config.json b/transcoder_all/layer_9_width_262k_l0_small/config.json index b6990f0e3b4226d112b4b25458b36893e1437c90..66f76ae7834122d8cad9cf23693b60a167dcf00f 100644 --- a/transcoder_all/layer_9_width_262k_l0_small/config.json +++ b/transcoder_all/layer_9_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 14, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_small_affine/config.json b/transcoder_all/layer_9_width_262k_l0_small_affine/config.json index 395b7ed3fbeacdf8d336d78f0b2966b5e03fbb78..da9947214caadbbdfbd0b976c3ae0cd957c4e4dc 100644 --- a/transcoder_all/layer_9_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_9_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 14, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file