diff --git a/transcoder_all/layer_11_width_262k_l0_big_affine/config.json b/transcoder_all/layer_11_width_262k_l0_big_affine/config.json index 1fc148ff076728560fc314905eac6ee5864d862b..6cc142c367ff6557ff238c882b4602ce0300e737 100644 --- a/transcoder_all/layer_11_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_11_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 91, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_small/config.json b/transcoder_all/layer_11_width_262k_l0_small/config.json index 2c21aee4a20c2b88a26b8180abb63c0ecf593e73..8afe5fa8695d30cbeaef9d8a347fefe132873209 100644 --- a/transcoder_all/layer_11_width_262k_l0_small/config.json +++ b/transcoder_all/layer_11_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_small_affine/config.json b/transcoder_all/layer_11_width_262k_l0_small_affine/config.json index 66ac3ff8ddc5665c33a9348985589ee5b604e82e..8aafdfefec4cc632da611e0d06fef4d17d70faf2 100644 --- a/transcoder_all/layer_11_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_11_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 15, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_big/config.json b/transcoder_all/layer_12_width_262k_l0_big/config.json index 2d553945497b2301afb150e52e1920391ec48d45..b062d93851bbaa65a3891d27e956ef5dd9e8d84d 100644 --- a/transcoder_all/layer_12_width_262k_l0_big/config.json +++ b/transcoder_all/layer_12_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 94, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_small/config.json b/transcoder_all/layer_12_width_262k_l0_small/config.json index 16a24e4c56eb936d045ae63738d06470193c3f0c..a574fd2476caaadf5dfb1350881744ad5bf03ba7 100644 --- a/transcoder_all/layer_12_width_262k_l0_small/config.json +++ b/transcoder_all/layer_12_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_big_affine/config.json b/transcoder_all/layer_13_width_262k_l0_big_affine/config.json index 8f5e4de4f599c62974858b48dbb2707d600117f3..bfae0c8c36a543bbf5ebf3967eb9b2fa2fc9c1d8 100644 --- a/transcoder_all/layer_13_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_13_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 97, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_small_affine/config.json b/transcoder_all/layer_13_width_262k_l0_small_affine/config.json index 8d19a02953e16da66660cf5913ebb7ab8b33cc16..5aaf9c55c7b73fe2c0d5c16735934ffdfdc4314d 100644 --- a/transcoder_all/layer_13_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_13_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 16, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_big_affine/config.json b/transcoder_all/layer_15_width_16k_l0_big_affine/config.json index 205d498fbcc2c55a2bd04206d1649cee16bf79af..3abebd57b71b3efb702b6173d4c8967b9fcb029a 100644 --- a/transcoder_all/layer_15_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_15_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 103, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_small/config.json b/transcoder_all/layer_15_width_16k_l0_small/config.json index 23599dab50d41a7612c0764c260ce1e35445fd2e..de4dbe5a32aa9f5a3662d4b65f4e5099b844d757 100644 --- a/transcoder_all/layer_15_width_16k_l0_small/config.json +++ b/transcoder_all/layer_15_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 17, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_big_affine/config.json b/transcoder_all/layer_16_width_16k_l0_big_affine/config.json index 71efa7c5605913ac43e25025145746dc3cf4318e..dd9702c9a18be560ced4bbbf58b7aa5f72e21200 100644 --- a/transcoder_all/layer_16_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_16_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 106, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_small_affine/config.json b/transcoder_all/layer_16_width_262k_l0_small_affine/config.json index ae698be098c89fcbcca1879bef05d0ac2e2a1caf..81058edae812f7db428909599693c6bbdd1b477c 100644 --- a/transcoder_all/layer_16_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_16_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 17, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_big/config.json b/transcoder_all/layer_17_width_16k_l0_big/config.json index c58aeadb41954a0dd5907b05dcfa0deaeeb10a76..ad6f06e942f88818f4bf4d2b9b16fa5dddbcb493 100644 --- a/transcoder_all/layer_17_width_16k_l0_big/config.json +++ b/transcoder_all/layer_17_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 109, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small/config.json b/transcoder_all/layer_17_width_262k_l0_small/config.json index 486f32ff7c7d62d026b4435e55052c3b672f0c7d..b79a7bc9bd86e402a6df3f17f1d5d242d2fddd64 100644 --- a/transcoder_all/layer_17_width_262k_l0_small/config.json +++ b/transcoder_all/layer_17_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small_affine/config.json b/transcoder_all/layer_17_width_262k_l0_small_affine/config.json index e2e3b4ad32989cacad70c5942d5e8ab1c1b03702..cd8c6f33c12d86adfba1cfa0990fdf37a6d9ce79 100644 --- a/transcoder_all/layer_17_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_17_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 18, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_16k_l0_big/config.json b/transcoder_all/layer_18_width_16k_l0_big/config.json index ef522075e3c437dbf6c52b7212fbd78742eac199..b0919590bca793173da5469b36b65c414ca96ead 100644 --- a/transcoder_all/layer_18_width_16k_l0_big/config.json +++ b/transcoder_all/layer_18_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 112, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_big/config.json b/transcoder_all/layer_18_width_262k_l0_big/config.json index 17c29216bb2ed38143ed9b970caeac1be6919018..5f3b643944a713d80de99f03808952f676c7722d 100644 --- a/transcoder_all/layer_18_width_262k_l0_big/config.json +++ b/transcoder_all/layer_18_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 112, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_big_affine/config.json b/transcoder_all/layer_18_width_262k_l0_big_affine/config.json index 97755b91489206c1275cdf36858231c510d3e5b0..3615a322d4feb385afb247f2cb6b9eab7bff96c9 100644 --- a/transcoder_all/layer_18_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_18_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 112, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_small/config.json b/transcoder_all/layer_19_width_16k_l0_small/config.json index 875cbf91ea5f5a1a07c4f9c4092785892db7d081..674122ac531cdcb063b2ece6ac871a256a48affb 100644 --- a/transcoder_all/layer_19_width_16k_l0_small/config.json +++ b/transcoder_all/layer_19_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 19, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_small/config.json b/transcoder_all/layer_19_width_262k_l0_small/config.json index 13558ca2a1a29a6b8cdc75376e7607af51a7bf92..3916679196d3c277567acf4437f4e2b97395767e 100644 --- a/transcoder_all/layer_19_width_262k_l0_small/config.json +++ b/transcoder_all/layer_19_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 19, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_big_affine/config.json b/transcoder_all/layer_1_width_262k_l0_big_affine/config.json index 4e85dda0865d19e67f2090984fc55c1dfe040b34..8fbe29df9c00a34e5363647bf34f907465e6ec44 100644 --- a/transcoder_all/layer_1_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_1_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 62, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_small_affine/config.json b/transcoder_all/layer_1_width_262k_l0_small_affine/config.json index 9d09baca18ace5bc2f41104600eb8c9df6a334f6..4255b2373f6123c5e264c0da3744dc8344ab6187 100644 --- a/transcoder_all/layer_1_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_1_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 10, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_16k_l0_big_affine/config.json b/transcoder_all/layer_22_width_16k_l0_big_affine/config.json index 7ef5b02e0e3681a0f9ab90d76cd85122b88b229a..92d9f91518c90d5a6ff49836c85345a98a3df308 100644 --- a/transcoder_all/layer_22_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_22_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_big_affine/config.json b/transcoder_all/layer_22_width_262k_l0_big_affine/config.json index 74a72fcfeb3d59b2eba314ea67b8ed0e55421c04..371ddacc31e651c846f0471a1cdb48e5156e9432 100644 --- a/transcoder_all/layer_22_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_22_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_small_affine/config.json b/transcoder_all/layer_22_width_262k_l0_small_affine/config.json index df7df892602fb507fbeaaef1000d7c7410409f43..db74d20c1ee752b26a316573d463b39877c2c3f9 100644 --- a/transcoder_all/layer_22_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_22_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_small_affine/config.json b/transcoder_all/layer_23_width_16k_l0_small_affine/config.json index 08010a332fc84641c915b3eca25771e55b57e7b2..44e46bac66192f0bf85d6eccd8de5e79d883c5d5 100644 --- a/transcoder_all/layer_23_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_23_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_small/config.json b/transcoder_all/layer_23_width_262k_l0_small/config.json index 974ac05504e375f12516970993b44591e4fbe99d..24419169954331fcd0cb7239de8afc53ddbbd81a 100644 --- a/transcoder_all/layer_23_width_262k_l0_small/config.json +++ b/transcoder_all/layer_23_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_big_affine/config.json b/transcoder_all/layer_24_width_262k_l0_big_affine/config.json index 6c26b89c0bb9f95bdd7ee3cbb5b98ff68377313e..59456ea991230ce793c058dabb4a9ff91e69ddff 100644 --- a/transcoder_all/layer_24_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_24_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_small_affine/config.json b/transcoder_all/layer_24_width_262k_l0_small_affine/config.json index 8468226bbfb61f3db82c2b14a6e247de1d8add0a..b57f8233cb837f205a625cc0251eea942cf720c6 100644 --- a/transcoder_all/layer_24_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_24_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_small_affine/config.json b/transcoder_all/layer_25_width_16k_l0_small_affine/config.json index a3fefd07bceac36d22c43e3472b2436354500749..e71a679b621f794c3a43f3de82caf43aa3bda0c0 100644 --- a/transcoder_all/layer_25_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_25_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_16k_l0_small_affine/config.json b/transcoder_all/layer_26_width_16k_l0_small_affine/config.json index 5a4ef77f1ee198fdb0aac71b759d330671fbf631..9ed71157f5cce8dd3b87e8318e0fb06578e6f5df 100644 --- a/transcoder_all/layer_26_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_26_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_16k_l0_small_affine/config.json b/transcoder_all/layer_27_width_16k_l0_small_affine/config.json index c62c221ed028ef41660142c5c370dd7edc3977fb..26992c8ce978580f1cab83656c6d41ac19ff8c17 100644 --- a/transcoder_all/layer_27_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_27_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_262k_l0_small/config.json b/transcoder_all/layer_27_width_262k_l0_small/config.json index 4d3ef02e62e4318dba3401a79a7faed93f85d50b..81df7cbe9dc4ffb137c2b45dfcc28cb3ec814ac8 100644 --- a/transcoder_all/layer_27_width_262k_l0_small/config.json +++ b/transcoder_all/layer_27_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_28_width_262k_l0_small_affine/config.json b/transcoder_all/layer_28_width_262k_l0_small_affine/config.json index 26da779d68776e45ea31d7454c11cdf7adc0f07a..4cd90da824dd757c2705612118f05e89065d9bb3 100644 --- a/transcoder_all/layer_28_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_28_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_16k_l0_big/config.json b/transcoder_all/layer_29_width_16k_l0_big/config.json index 67af62a209fe955e9e7d7f8ffa9db2033ab9fcd4..9824b9e290157e91528ecf650066a75e50d1943a 100644 --- a/transcoder_all/layer_29_width_16k_l0_big/config.json +++ b/transcoder_all/layer_29_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_16k_l0_small/config.json b/transcoder_all/layer_29_width_16k_l0_small/config.json index 082007f54d2bab291184e0626c96151766b7d66e..e89b2bb0f1cd8401bf4c34fbaad99c53cce61a49 100644 --- a/transcoder_all/layer_29_width_16k_l0_small/config.json +++ b/transcoder_all/layer_29_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_262k_l0_small_affine/config.json b/transcoder_all/layer_29_width_262k_l0_small_affine/config.json index f0a5196c74cb8e0184d2b2b63107335215f42030..60f9461eae184af034a833fc8b89340534727ec8 100644 --- a/transcoder_all/layer_29_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_29_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_big/config.json b/transcoder_all/layer_2_width_16k_l0_big/config.json index 6a462fa6f817e091092b34773aadb03d9be27f5e..06599d0b61504bcae4ad0d525adcfe49c44a739b 100644 --- a/transcoder_all/layer_2_width_16k_l0_big/config.json +++ b/transcoder_all/layer_2_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 65, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_big/config.json b/transcoder_all/layer_2_width_262k_l0_big/config.json index 276ec2a47c1c42655b53b06f7e94d3ba27b5ff70..8c61e0588913042513de0378d32da8bbc8a267f4 100644 --- a/transcoder_all/layer_2_width_262k_l0_big/config.json +++ b/transcoder_all/layer_2_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 65, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_16k_l0_big/config.json b/transcoder_all/layer_30_width_16k_l0_big/config.json index 6bf3278a659db5f22ae696f7f3809c27baaf5c65..143e842b3c9d6cbd49558742085caf5d9f9f1566 100644 --- a/transcoder_all/layer_30_width_16k_l0_big/config.json +++ b/transcoder_all/layer_30_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_16k_l0_big/config.json b/transcoder_all/layer_31_width_16k_l0_big/config.json index 389e2df91be059a3953deac269b172bd09e15d3c..2df0934d98dd0b17cd0f1ce6ac707269d486d707 100644 --- a/transcoder_all/layer_31_width_16k_l0_big/config.json +++ b/transcoder_all/layer_31_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_262k_l0_small_affine/config.json b/transcoder_all/layer_31_width_262k_l0_small_affine/config.json index ff72e8de151f337dbe6d756f75d804b5e90cd6d2..47544c610aa1c2903b1f4392f2b7ea08b3c4224f 100644 --- a/transcoder_all/layer_31_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_31_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_32_width_16k_l0_big_affine/config.json b/transcoder_all/layer_32_width_16k_l0_big_affine/config.json index bef8fa3edef138bad906ee98b074b9b493e5c190..7d92422b8720a1dbbef9ed9f00cce0d91a335c6f 100644 --- a/transcoder_all/layer_32_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_32_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_262k_l0_small_affine/config.json b/transcoder_all/layer_33_width_262k_l0_small_affine/config.json index 920f53085f38453358bc9312cd188251319ea389..f550851ca0508ba2b0a7f33c08f315c728adcd18 100644 --- a/transcoder_all/layer_33_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_33_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_262k_l0_small_affine/config.json b/transcoder_all/layer_34_width_262k_l0_small_affine/config.json index e8c4c4262514c8eaade037b6947084533a3baaeb..8a29ac1d8ea1fa4e6ba5b0d7ef4fbd2aedb11da2 100644 --- a/transcoder_all/layer_34_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_34_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_16k_l0_small_affine/config.json b/transcoder_all/layer_35_width_16k_l0_small_affine/config.json index 256b976d6c247051ecddf7e9e2619bf62033224f..3a46cf9259276152b8ac11564bc14837adaa7b4f 100644 --- a/transcoder_all/layer_35_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_35_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_262k_l0_small_affine/config.json b/transcoder_all/layer_35_width_262k_l0_small_affine/config.json index 93da0cdd5a3fa5392621e33c78fb1d523fbc9f54..41cd92260de1b9a0e9aa10109255000b7ab22d51 100644 --- a/transcoder_all/layer_35_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_35_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_36_width_262k_l0_big/config.json b/transcoder_all/layer_36_width_262k_l0_big/config.json index 87103664002448c3f57942d3d59a8f304e6ec1f4..34a29d0417adbf03976989c1e89363b4f75b39c1 100644 --- a/transcoder_all/layer_36_width_262k_l0_big/config.json +++ b/transcoder_all/layer_36_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.36.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_16k_l0_big/config.json b/transcoder_all/layer_37_width_16k_l0_big/config.json index eb8be6d889e71a2e86e9cc1115bcc207b28c6e5b..0007d127dad5bfa79dd1d38a894a254c52002ce3 100644 --- a/transcoder_all/layer_37_width_16k_l0_big/config.json +++ b/transcoder_all/layer_37_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_16k_l0_small/config.json b/transcoder_all/layer_37_width_16k_l0_small/config.json index be496508ffb91b568e2fd0fcc1441c65cf124113..49eb0ec9fa90c8c8bdcb98ba516e3ef83599ca22 100644 --- a/transcoder_all/layer_37_width_16k_l0_small/config.json +++ b/transcoder_all/layer_37_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_262k_l0_big/config.json b/transcoder_all/layer_38_width_262k_l0_big/config.json index acf9357db8196ec11e12115170deb53dc8c6780d..2eeaacb8efe6fb712838aac66f9c55f3e5c64333 100644 --- a/transcoder_all/layer_38_width_262k_l0_big/config.json +++ b/transcoder_all/layer_38_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_262k_l0_small_affine/config.json b/transcoder_all/layer_38_width_262k_l0_small_affine/config.json index c3a09e75415ddd486431b837da6756fb060e2a6d..d9eea01ebf1a6c28081ec7f885f679d9636e4ce3 100644 --- a/transcoder_all/layer_38_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_38_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_16k_l0_small/config.json b/transcoder_all/layer_39_width_16k_l0_small/config.json index c406bfcc143312354ac06d2c2d6a99077c8b3384..4a39284a272f1cdcaddb2a279268564310e79889 100644 --- a/transcoder_all/layer_39_width_16k_l0_small/config.json +++ b/transcoder_all/layer_39_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_262k_l0_big/config.json b/transcoder_all/layer_39_width_262k_l0_big/config.json index 6209ca21b647ea1defa61e4b805e78359db2b01d..c20ea7d14954b74fe78e78ee32c5593563e24245 100644 --- a/transcoder_all/layer_39_width_262k_l0_big/config.json +++ b/transcoder_all/layer_39_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_262k_l0_small_affine/config.json b/transcoder_all/layer_39_width_262k_l0_small_affine/config.json index d299f6de31bca47f68ebc1b9b18c84addb80eba1..546da5a3aa44077e4f5b6e3eeaec6d29d82fa468 100644 --- a/transcoder_all/layer_39_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_39_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_small/config.json b/transcoder_all/layer_3_width_262k_l0_small/config.json index 8f82c944924fff48ea2390ab5cfc42338464a6fa..dead965f9303fd0bd797e2985688f0d29b558370 100644 --- a/transcoder_all/layer_3_width_262k_l0_small/config.json +++ b/transcoder_all/layer_3_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 11, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_40_width_16k_l0_big/config.json b/transcoder_all/layer_40_width_16k_l0_big/config.json index 36ca32309b21f9781ae1d812556c652a2a2d167c..feaa7df585afdeb08e4febd9779984c461005532 100644 --- a/transcoder_all/layer_40_width_16k_l0_big/config.json +++ b/transcoder_all/layer_40_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.40.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_40_width_16k_l0_small_affine/config.json b/transcoder_all/layer_40_width_16k_l0_small_affine/config.json index 9dd795f1f9ef956a068422c9b528e8433080f61d..4a57e2cf6e457dc83ec7ca7b5823103e2ed4644e 100644 --- a/transcoder_all/layer_40_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_40_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.40.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_40_width_262k_l0_big/config.json b/transcoder_all/layer_40_width_262k_l0_big/config.json index 1a7701af50f9b0a3ab244cce81b2234c929fd360..f762ca3b545a1d98a555c00e7351ca4ee375a90c 100644 --- a/transcoder_all/layer_40_width_262k_l0_big/config.json +++ b/transcoder_all/layer_40_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.40.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_41_width_16k_l0_small_affine/config.json b/transcoder_all/layer_41_width_16k_l0_small_affine/config.json index 2583e39c3b925e3ba052eefbfdca60856b4bbd00..d15df29aa17721ec1ba0d6a301254f967458616d 100644 --- a/transcoder_all/layer_41_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_41_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.41.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_42_width_262k_l0_small_affine/config.json b/transcoder_all/layer_42_width_262k_l0_small_affine/config.json index c5538acaa06cd94c5e6094b9e2e2d7a6d4b10d5b..efe91a0e1fc9d9f2c54250cb81ecd6609bc52b88 100644 --- a/transcoder_all/layer_42_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_42_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.42.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_43_width_262k_l0_big_affine/config.json b/transcoder_all/layer_43_width_262k_l0_big_affine/config.json index 9cff6030c8347fe42bf2ec2ea32a51b6389d3e80..e1d2ce1c3901da1d120d650ce6d2fdcb1651243c 100644 --- a/transcoder_all/layer_43_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_43_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_44_width_262k_l0_small/config.json b/transcoder_all/layer_44_width_262k_l0_small/config.json index f27074f7176313d3f562e10539f59a5968f2fc31..f8c0e189a4b56efd508993b638ddb6b5d3a95cd5 100644 --- a/transcoder_all/layer_44_width_262k_l0_small/config.json +++ b/transcoder_all/layer_44_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.44.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_45_width_262k_l0_big/config.json b/transcoder_all/layer_45_width_262k_l0_big/config.json index cf1eec304a869c2d3b11effe09097e2fc821a5fb..5a10033f87a9d0c7f703ac4a2006961d8c6bb2dd 100644 --- a/transcoder_all/layer_45_width_262k_l0_big/config.json +++ b/transcoder_all/layer_45_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.45.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_16k_l0_big_affine/config.json b/transcoder_all/layer_47_width_16k_l0_big_affine/config.json index 4f7433d1633917654957280e0de90041523f842e..875ad0b0b8ae3f89a4ac3f9efc797d5ae737ac64 100644 --- a/transcoder_all/layer_47_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_47_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_16k_l0_big_affine/config.json b/transcoder_all/layer_48_width_16k_l0_big_affine/config.json index 8bdb8c33c24dacde477349ff270334283350a353..cd5db509b0c6d3b0168864b091b4c38a4611e5d6 100644 --- a/transcoder_all/layer_48_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_48_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_16k_l0_small/config.json b/transcoder_all/layer_48_width_16k_l0_small/config.json index 3961410b0bfba107e80983ded5e308c54de47aaf..1f96ef565c7e4e811e7e21f4abda4c74cafe94d8 100644 --- a/transcoder_all/layer_48_width_16k_l0_small/config.json +++ b/transcoder_all/layer_48_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_16k_l0_big/config.json b/transcoder_all/layer_49_width_16k_l0_big/config.json index 9ec5f996af1e41b389322666ee31b288af83b5cf..6dbef7f7d66feb5a98727373f1987ceadeaae234 100644 --- a/transcoder_all/layer_49_width_16k_l0_big/config.json +++ b/transcoder_all/layer_49_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_16k_l0_big_affine/config.json b/transcoder_all/layer_49_width_16k_l0_big_affine/config.json index d17f95324fe91a33b48da13722940a1019b6bc9b..b4a8e14fb0f4cc0f6cdaf55d7af48e68113bf1b7 100644 --- a/transcoder_all/layer_49_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_49_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_small_affine/config.json b/transcoder_all/layer_4_width_16k_l0_small_affine/config.json index b3c3d147638f5c347a90044a4bd915050a489537..083d4799acc5d63b836bdde1adde0defcc5cf3fc 100644 --- a/transcoder_all/layer_4_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_4_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 11, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_small_affine/config.json b/transcoder_all/layer_4_width_262k_l0_small_affine/config.json index 62c71c4f12108e13848ba9b573a189396f4153ea..cf8ee6d6b9997a61f00f6e2635401698e800b1ce 100644 --- a/transcoder_all/layer_4_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_4_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 11, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_262k_l0_big_affine/config.json b/transcoder_all/layer_50_width_262k_l0_big_affine/config.json index 3bbd510fadbaea2edc39773509313dbe6d486a59..eb4b916a0d1bc0b2bc190096bfdd362be5c5bec6 100644 --- a/transcoder_all/layer_50_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_50_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_262k_l0_small_affine/config.json b/transcoder_all/layer_50_width_262k_l0_small_affine/config.json index 7f880f52ebda86b161fdbbd47c1f903e0b6a7fc1..c256a4a0052b81850cc0e1a308c3b9874ccf12b7 100644 --- a/transcoder_all/layer_50_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_50_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_262k_l0_small/config.json b/transcoder_all/layer_52_width_262k_l0_small/config.json index 4aed8cc70c54cf9363aab441fdce72963347c2f6..5b2ba8d501786441e8bfe3adb0a858b49f23fd8e 100644 --- a/transcoder_all/layer_52_width_262k_l0_small/config.json +++ b/transcoder_all/layer_52_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_262k_l0_small_affine/config.json b/transcoder_all/layer_52_width_262k_l0_small_affine/config.json index 1385d8ad4b392906a3739c1b3e34c9b862d9e4d6..d463241b018b47f7eab1582d2d22e769f321e687 100644 --- a/transcoder_all/layer_52_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_52_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_16k_l0_big/config.json b/transcoder_all/layer_53_width_16k_l0_big/config.json index 7e714c4d5c6f911c97b72d74ccffc8350689361d..5a2db28eea2fe15f44b1ba277cbb6c7e5c1fa6fa 100644 --- a/transcoder_all/layer_53_width_16k_l0_big/config.json +++ b/transcoder_all/layer_53_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_16k_l0_big_affine/config.json b/transcoder_all/layer_53_width_16k_l0_big_affine/config.json index 86fca6f20d10ce5637ea9308f02b0cc08096a3c2..dc4f954c11d76946a51369a59b19b4bf3e912120 100644 --- a/transcoder_all/layer_53_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_53_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_54_width_262k_l0_small_affine/config.json b/transcoder_all/layer_54_width_262k_l0_small_affine/config.json index 6adc7cf34b58e613e3f3c8ee4d6a38053ccfca43..13f82936c00a6a8083b07cc01d51b28002de85de 100644 --- a/transcoder_all/layer_54_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_54_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.54.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_262k_l0_big_affine/config.json b/transcoder_all/layer_55_width_262k_l0_big_affine/config.json index 59195506fe38bc75b6a1b3e00d136e797beb0f3e..c6f3e3af97da5eb1ea197d0b3b0b9ea26c0e532f 100644 --- a/transcoder_all/layer_55_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_55_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_262k_l0_big/config.json b/transcoder_all/layer_56_width_262k_l0_big/config.json index 2c49f2aa9df18c44801752f27fca29854dde74ae..d3c18adb3d294f88db57c1d22a381480f62a3b5a 100644 --- a/transcoder_all/layer_56_width_262k_l0_big/config.json +++ b/transcoder_all/layer_56_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_262k_l0_big_affine/config.json b/transcoder_all/layer_56_width_262k_l0_big_affine/config.json index 00ad6be489be9931a63b2e0c4319bd3c0f512d94..58758e463b0939c764dc62e778859e83bef2497d 100644 --- a/transcoder_all/layer_56_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_56_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_16k_l0_big/config.json b/transcoder_all/layer_57_width_16k_l0_big/config.json index c5a956f6b93e1983015a96de370e9c86aca63168..2829fa214dfecc60a638dc79293c06197478e62a 100644 --- a/transcoder_all/layer_57_width_16k_l0_big/config.json +++ b/transcoder_all/layer_57_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_16k_l0_small_affine/config.json b/transcoder_all/layer_57_width_16k_l0_small_affine/config.json index f1c1bb0320906c6d69f2245be3c072f6438d22c5..2a205989df278a70a34f1658fdfd371c1ffa64e0 100644 --- a/transcoder_all/layer_57_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_57_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_59_width_262k_l0_small/config.json b/transcoder_all/layer_59_width_262k_l0_small/config.json index 77b88dbbdbc97b855899306cd10965151b42fa53..36f143d3bcddbb15b4d7b454fc85f22470fc3dcc 100644 --- a/transcoder_all/layer_59_width_262k_l0_small/config.json +++ b/transcoder_all/layer_59_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.59.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.59.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_big/config.json b/transcoder_all/layer_5_width_262k_l0_big/config.json index c0bfa46fd959235e67e899b939a1db1c1b25756a..3fcf1e6943d0e98aec770aed4fe0061cc6765981 100644 --- a/transcoder_all/layer_5_width_262k_l0_big/config.json +++ b/transcoder_all/layer_5_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 74, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_60_width_16k_l0_big/config.json b/transcoder_all/layer_60_width_16k_l0_big/config.json index 093c85baacfaeb6224e6287905ce77cbb9791819..0bb090f71ca4f17265a5b2f9125622ae11b257dc 100644 --- a/transcoder_all/layer_60_width_16k_l0_big/config.json +++ b/transcoder_all/layer_60_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.60.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_61_width_262k_l0_big_affine/config.json b/transcoder_all/layer_61_width_262k_l0_big_affine/config.json index 629c2924ccf17676ef74e9f229988421873b0d99..23fb5c881ba566541c7583194ed358bb736ebc66 100644 --- a/transcoder_all/layer_61_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_61_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.61.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_big/config.json b/transcoder_all/layer_6_width_16k_l0_big/config.json index 5c543990e6166f3be70583a1e2553972511a2a28..c717f087613287422ed2728338f229ea7522a067 100644 --- a/transcoder_all/layer_6_width_16k_l0_big/config.json +++ b/transcoder_all/layer_6_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 77, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_small/config.json b/transcoder_all/layer_6_width_262k_l0_small/config.json index cc9d646942038b214446bccb895cfa918cc39261..499e07af586256c9ddd34a855f52e63bae211841 100644 --- a/transcoder_all/layer_6_width_262k_l0_small/config.json +++ b/transcoder_all/layer_6_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 12, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_big/config.json b/transcoder_all/layer_7_width_16k_l0_big/config.json index c4f615d458480a2d5195c5cebc628bebf9902e75..af3b8c98d8d311a5453c1b100aa12b5c4c8d3127 100644 --- a/transcoder_all/layer_7_width_16k_l0_big/config.json +++ b/transcoder_all/layer_7_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 80, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_big/config.json b/transcoder_all/layer_8_width_262k_l0_big/config.json index 511eadd50ff14cfaeac14b177494724a8db1b5d3..b8ce6231ef73c7490b7cc9be6d66946939dd6bfa 100644 --- a/transcoder_all/layer_8_width_262k_l0_big/config.json +++ b/transcoder_all/layer_8_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 83, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_big_affine/config.json b/transcoder_all/layer_8_width_262k_l0_big_affine/config.json index 57525d303b3da28037ef07283a2e4ab590864708..691ebd6ce0ba647f985cd81dbab4a6229722bdde 100644 --- a/transcoder_all/layer_8_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_8_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 83, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_big/config.json b/transcoder_all/layer_9_width_16k_l0_big/config.json index 614808560f10b3a43ea497300864604762fc945a..022ec09f70c81f797e5af8492c1d54dd3505c718 100644 --- a/transcoder_all/layer_9_width_16k_l0_big/config.json +++ b/transcoder_all/layer_9_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 86, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_small_affine/config.json b/transcoder_all/layer_9_width_16k_l0_small_affine/config.json index 4962abe9568f3a2821f3bbe0cd0c703c68badace..8b07356a14b1cb83eec9c3912dd966416b5f2736 100644 --- a/transcoder_all/layer_9_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_9_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-pt", + "model_name": "google/gemma-3-27b-pt", "architecture": "jump_relu", "l0": 14, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file