diff --git a/transcoder_all/layer_12_width_16k_l0_big/config.json b/transcoder_all/layer_12_width_16k_l0_big/config.json index 8f6771cc0d10546f1a063860d310b58e5486e690..9c63187cc9fd39fbed7a1044ba3dfa58d06309ea 100644 --- a/transcoder_all/layer_12_width_16k_l0_big/config.json +++ b/transcoder_all/layer_12_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 94, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_big_affine/config.json b/transcoder_all/layer_13_width_16k_l0_big_affine/config.json index e6d0a915f21762ce97bbe108bdaceb4efa73e5ab..edb165fd2e72340d9ce716eb47efb31baf294610 100644 --- a/transcoder_all/layer_13_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_13_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 97, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_big/config.json b/transcoder_all/layer_13_width_262k_l0_big/config.json index c1a478ebbd453fcd0dd3234a66bd8371230ddd42..db53a7f82bdc8fa9cb2e10d2220d70f1aace3dbf 100644 --- a/transcoder_all/layer_13_width_262k_l0_big/config.json +++ b/transcoder_all/layer_13_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 97, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_small_affine/config.json b/transcoder_all/layer_14_width_262k_l0_small_affine/config.json index b4edb85bad297b5ee39fb67d1772848f7587abc8..b68dfd358daa399680e2f6da8435edee0c2f1a37 100644 --- a/transcoder_all/layer_14_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_14_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_big/config.json b/transcoder_all/layer_15_width_16k_l0_big/config.json index 47ebd757998c8fa696c8fea556c7aeb00597de21..59128bf965bda0d2e1b900c7f0f94fa9eb59ee89 100644 --- a/transcoder_all/layer_15_width_16k_l0_big/config.json +++ b/transcoder_all/layer_15_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 103, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_big/config.json b/transcoder_all/layer_15_width_262k_l0_big/config.json index c9eac05a6cc9705e59bc374094bf7dc52ffd545c..af943e283ed8a9d2ed0fc6e82d94719b0ddee15c 100644 --- a/transcoder_all/layer_15_width_262k_l0_big/config.json +++ b/transcoder_all/layer_15_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 103, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_small_affine/config.json b/transcoder_all/layer_16_width_262k_l0_small_affine/config.json index 90e8a669a50f4c40aea2263dc6f2386e80a08429..f273aadd3bf8a4b372b77ae37a5dc67d63e81def 100644 --- a/transcoder_all/layer_16_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_16_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 17, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_big_affine/config.json b/transcoder_all/layer_19_width_16k_l0_big_affine/config.json index a1164841629417551987675babbb7133cb67ca4b..474ef7d8ff2326a4c87b1c25c42238bc2bb9559d 100644 --- a/transcoder_all/layer_19_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_19_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 115, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_small_affine/config.json b/transcoder_all/layer_19_width_16k_l0_small_affine/config.json index 4db77c4b25e6468567b3ab08ee58f6545dcc8823..de759d7f68f02de8c22b567c95ab23b342f91660 100644 --- a/transcoder_all/layer_19_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_19_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 19, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_big/config.json b/transcoder_all/layer_19_width_262k_l0_big/config.json index a7e17761d3dae573c8a35d67c7c578f378433cf8..b2f7ba8888354e1dd34c6b22c2cfe8e9c08137a4 100644 --- a/transcoder_all/layer_19_width_262k_l0_big/config.json +++ b/transcoder_all/layer_19_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 115, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_small_affine/config.json b/transcoder_all/layer_19_width_262k_l0_small_affine/config.json index 255cc7cb614a8a375b45fd1d2b004cd855e23686..1795a047595f36881bba54e431b43338d9d2a8de 100644 --- a/transcoder_all/layer_19_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_19_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 19, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_16k_l0_small/config.json b/transcoder_all/layer_1_width_16k_l0_small/config.json index 72b02c03876827057984093d5b70f9efc014dcac..1e50d530a29615075cfd4751f38e8a36bf705f72 100644 --- a/transcoder_all/layer_1_width_16k_l0_small/config.json +++ b/transcoder_all/layer_1_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_big/config.json b/transcoder_all/layer_20_width_16k_l0_big/config.json index 3542d0e9f633580803d6969c36dba4de664246e9..47930256bcfa33e98b9ea6439941cf5c823be7eb 100644 --- a/transcoder_all/layer_20_width_16k_l0_big/config.json +++ b/transcoder_all/layer_20_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 118, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_20_width_16k_l0_big_affine/config.json b/transcoder_all/layer_20_width_16k_l0_big_affine/config.json index 5f21319fe298a998abce60f75a1d01286c4f0f7e..e1fe8c3fbfafcbe913ba5653b08abc218ff645fc 100644 --- a/transcoder_all/layer_20_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_20_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 118, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_small_affine/config.json b/transcoder_all/layer_22_width_262k_l0_small_affine/config.json index b325825ec685f2c58fb7502715321817f1676dbe..0bc4806c9d265263ca27ed2f19f781b347d03f3a 100644 --- a/transcoder_all/layer_22_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_22_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_small_affine/config.json b/transcoder_all/layer_23_width_262k_l0_small_affine/config.json index 22d3f25d6950a46b14bd60cfacc9c716de6e08be..da7700320389fdf38d47ba0b26b02127ab3ba70f 100644 --- a/transcoder_all/layer_23_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_23_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_16k_l0_big/config.json b/transcoder_all/layer_25_width_16k_l0_big/config.json index 02aa6b0a10f9fd12ff261bb79749251f6e4a1842..8aa064db71058681df10f331a4d0b4cf2975ca6e 100644 --- a/transcoder_all/layer_25_width_16k_l0_big/config.json +++ b/transcoder_all/layer_25_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_262k_l0_small/config.json b/transcoder_all/layer_26_width_262k_l0_small/config.json index 70d2184fda94e4508a91d26529dc8e5c3f955619..e7bbb0c9df94c46976504a2b4a6045d81abd3cbc 100644 --- a/transcoder_all/layer_26_width_262k_l0_small/config.json +++ b/transcoder_all/layer_26_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_262k_l0_small_affine/config.json b/transcoder_all/layer_26_width_262k_l0_small_affine/config.json index 153e37a394db77640e9aec93c9a6799d10ee9f10..0304a75dde20954e70ef5ede1f2b2920b20985f3 100644 --- a/transcoder_all/layer_26_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_26_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_16k_l0_big/config.json b/transcoder_all/layer_27_width_16k_l0_big/config.json index a38e523f8e568a9ef2d79e248e2fa30f3947b520..de830224c0d8e6c7f094070b6ab41e6c97fb9981 100644 --- a/transcoder_all/layer_27_width_16k_l0_big/config.json +++ b/transcoder_all/layer_27_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_28_width_16k_l0_big_affine/config.json b/transcoder_all/layer_28_width_16k_l0_big_affine/config.json index 46778f277af134495219c39c0856d67836fca8e8..7926d780a23983e704757239d7221dac7fd70773 100644 --- a/transcoder_all/layer_28_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_28_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_28_width_262k_l0_small_affine/config.json b/transcoder_all/layer_28_width_262k_l0_small_affine/config.json index d46be4969dd81dc2fed154c236cffe2327c1831e..4673156b3e50a2da435686b60ca9befc1681afb2 100644 --- a/transcoder_all/layer_28_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_28_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_16k_l0_small/config.json b/transcoder_all/layer_29_width_16k_l0_small/config.json index 92bfcad78cade8e0527bbe1e8c238e6ca811432e..a23f4a008ba7ea15282cd10812aa940ab6222e47 100644 --- a/transcoder_all/layer_29_width_16k_l0_small/config.json +++ b/transcoder_all/layer_29_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_small/config.json b/transcoder_all/layer_2_width_262k_l0_small/config.json index c4104b30fafb93def248dce85bf3d43ef060247a..7a4f8530cdeaf5c660d61bc3d753bf9c048010bf 100644 --- a/transcoder_all/layer_2_width_262k_l0_small/config.json +++ b/transcoder_all/layer_2_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_262k_l0_small_affine/config.json b/transcoder_all/layer_30_width_262k_l0_small_affine/config.json index 824c4fca709aff421289fa6a59812c3745ea5c28..2c48249d1277971f9331520e2c6e424f188839c7 100644 --- a/transcoder_all/layer_30_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_30_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_32_width_262k_l0_small_affine/config.json b/transcoder_all/layer_32_width_262k_l0_small_affine/config.json index 091c4358c7d81a4fd3b49dd9b2ef332eb9b3463e..c6968b91c84057c6d83b8a4528d4e57684d567f2 100644 --- a/transcoder_all/layer_32_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_32_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_16k_l0_small/config.json b/transcoder_all/layer_33_width_16k_l0_small/config.json index 9d9aac06d8922e69501aa621469d399aa9430728..b97aeeb774843b423c6a6da0ef2557f57e58437f 100644 --- a/transcoder_all/layer_33_width_16k_l0_small/config.json +++ b/transcoder_all/layer_33_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_16k_l0_big/config.json b/transcoder_all/layer_37_width_16k_l0_big/config.json index 6ab2c7029dfe8a188be394f684e0f650f02f3a4a..e27a7c5ce179f80235546a4066a54904e91eca7b 100644 --- a/transcoder_all/layer_37_width_16k_l0_big/config.json +++ b/transcoder_all/layer_37_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_16k_l0_big_affine/config.json b/transcoder_all/layer_37_width_16k_l0_big_affine/config.json index 29579f2b837bf6e87ace399ddec5ff090454fd17..4d92ca6da78b34ac48f75a063a05093abf5fcbe8 100644 --- a/transcoder_all/layer_37_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_37_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_16k_l0_small/config.json b/transcoder_all/layer_39_width_16k_l0_small/config.json index 43e392e81ec62a3a1e6107404f0baa385939866f..9a355f102e8c3ed0c2e885cec72fff81cbf90556 100644 --- a/transcoder_all/layer_39_width_16k_l0_small/config.json +++ b/transcoder_all/layer_39_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_262k_l0_big_affine/config.json b/transcoder_all/layer_39_width_262k_l0_big_affine/config.json index 90147a8a71be2f46755d3bec8a506aa4a9ce1d0b..7145902c0aeb39c8228a30ad7b4fdd7e07105c98 100644 --- a/transcoder_all/layer_39_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_39_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_big_affine/config.json b/transcoder_all/layer_3_width_16k_l0_big_affine/config.json index 736d7226e35c1c43cc9b50035129fd38ac5f00a1..5e7a21e251d4e7d12a71a734b45580fa4726d00d 100644 --- a/transcoder_all/layer_3_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_3_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 68, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_41_width_262k_l0_big/config.json b/transcoder_all/layer_41_width_262k_l0_big/config.json index d5b9d2ffbe829adf29cb3d3f30804e35a2f68dcc..861dadcc4b3a3dba7b9656a04582e8a2dffda0ce 100644 --- a/transcoder_all/layer_41_width_262k_l0_big/config.json +++ b/transcoder_all/layer_41_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.41.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_42_width_16k_l0_big/config.json b/transcoder_all/layer_42_width_16k_l0_big/config.json index d9d1291b0c34eea5605e7ff9c3edf5b8ae0ea87d..02bbf1f4fadff985f1110cf74a7c5054813c83b7 100644 --- a/transcoder_all/layer_42_width_16k_l0_big/config.json +++ b/transcoder_all/layer_42_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.42.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_42_width_262k_l0_big/config.json b/transcoder_all/layer_42_width_262k_l0_big/config.json index 5ba4829a27a57a82231da02b79001629f4fc03f3..04ee2549694f11b5cd96a325691619634666ac82 100644 --- a/transcoder_all/layer_42_width_262k_l0_big/config.json +++ b/transcoder_all/layer_42_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.42.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_43_width_262k_l0_big/config.json b/transcoder_all/layer_43_width_262k_l0_big/config.json index f7d1e20cc43d829fb5d5d983b4f40ef01704aef7..26caaae98df999d949f7998f1e423a8d553981ce 100644 --- a/transcoder_all/layer_43_width_262k_l0_big/config.json +++ b/transcoder_all/layer_43_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_45_width_262k_l0_big_affine/config.json b/transcoder_all/layer_45_width_262k_l0_big_affine/config.json index 4b16976266c5306ce4cc850ce963ba0763b277fe..9b828768a06137f57eb03a2a4b351b97019a9d8d 100644 --- a/transcoder_all/layer_45_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_45_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.45.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_46_width_262k_l0_big/config.json b/transcoder_all/layer_46_width_262k_l0_big/config.json index 57a6427f7e7de02b5897dba4dfa6baa50cfa82c7..2aa5e343ade02fed7cf8986486ed7007928140f9 100644 --- a/transcoder_all/layer_46_width_262k_l0_big/config.json +++ b/transcoder_all/layer_46_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.46.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.46.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_46_width_262k_l0_small_affine/config.json b/transcoder_all/layer_46_width_262k_l0_small_affine/config.json index 9df986e816e2424f9e859afcf6fd0039c20a12c4..508143f9102d1f450cc85de780918c5e9c37a20f 100644 --- a/transcoder_all/layer_46_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_46_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.46.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.46.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_16k_l0_small_affine/config.json b/transcoder_all/layer_47_width_16k_l0_small_affine/config.json index e342682a548b46b5dd27b70bf3d567c368d423af..31ca06f98dad2bc6a81ebf8d7e95fabe5df23812 100644 --- a/transcoder_all/layer_47_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_47_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_262k_l0_big_affine/config.json b/transcoder_all/layer_48_width_262k_l0_big_affine/config.json index 91d00c8d5ca9d3b7b8edeef49276f7d185426fc7..55462ba8917bf63593a7b37bbf25f1effbc4647c 100644 --- a/transcoder_all/layer_48_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_48_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_262k_l0_big_affine/config.json b/transcoder_all/layer_49_width_262k_l0_big_affine/config.json index fcd1347563840b3bc95e7511bb8937301caf4bb7..0f44143e112d0517ebd9d371050ca80096d5039d 100644 --- a/transcoder_all/layer_49_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_49_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_51_width_262k_l0_small/config.json b/transcoder_all/layer_51_width_262k_l0_small/config.json index 3881c545fdd2a27683cc9a0d6fbaa3101ec398c5..61d153c48c3d95795ef3c0e455faa3c58277412c 100644 --- a/transcoder_all/layer_51_width_262k_l0_small/config.json +++ b/transcoder_all/layer_51_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.51.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.51.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_16k_l0_small/config.json b/transcoder_all/layer_53_width_16k_l0_small/config.json index 3cb565481287de4a35df7603f657eac6f48c5448..f0a11bf7510bb6593df628e28926685ddc22f5ad 100644 --- a/transcoder_all/layer_53_width_16k_l0_small/config.json +++ b/transcoder_all/layer_53_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_262k_l0_small_affine/config.json b/transcoder_all/layer_53_width_262k_l0_small_affine/config.json index 71409121fd25dd222fe7eda21b373724d257c713..7e5ac4786f216c3a23c46987c6d16718f31346b7 100644 --- a/transcoder_all/layer_53_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_53_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_16k_l0_small/config.json b/transcoder_all/layer_55_width_16k_l0_small/config.json index 38e601f29f6278842160d399157ddaba8b61da62..4dfc22a93b2be6374fe9a2de41562b29d4d2b780 100644 --- a/transcoder_all/layer_55_width_16k_l0_small/config.json +++ b/transcoder_all/layer_55_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_16k_l0_small_affine/config.json b/transcoder_all/layer_55_width_16k_l0_small_affine/config.json index d56c5892543b42599ba83072289a4d0f135ffbe4..32022ca06f8dbbea86e8dc451ed1c27f61424200 100644 --- a/transcoder_all/layer_55_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_55_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_262k_l0_big_affine/config.json b/transcoder_all/layer_55_width_262k_l0_big_affine/config.json index 9fa9261ddfb09bb9ed05a2c22fdafb3e420a01d8..6558798147730e303e02f332dd5c61310a2f83de 100644 --- a/transcoder_all/layer_55_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_55_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_262k_l0_small/config.json b/transcoder_all/layer_56_width_262k_l0_small/config.json index e9d0bb52a6df636c4ffee978c72a649779abb777..62b06a1404287a47800d83416003cfe7e26a077d 100644 --- a/transcoder_all/layer_56_width_262k_l0_small/config.json +++ b/transcoder_all/layer_56_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_262k_l0_small_affine/config.json b/transcoder_all/layer_56_width_262k_l0_small_affine/config.json index 1b3c2cd25704b4cf3e9f744525d7a216197174a3..b97a90ddd3ca94b1c78a97ba04d8137c89080e96 100644 --- a/transcoder_all/layer_56_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_56_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_16k_l0_small/config.json b/transcoder_all/layer_57_width_16k_l0_small/config.json index 0843ebdffa454f83f603e663e77607a2d87637ac..811a3dfc2cba8148ef51967988cffaca8101ba56 100644 --- a/transcoder_all/layer_57_width_16k_l0_small/config.json +++ b/transcoder_all/layer_57_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_58_width_16k_l0_big_affine/config.json b/transcoder_all/layer_58_width_16k_l0_big_affine/config.json index 7858c7153bac39bdbf0dc3f8b34b0bd1d0348241..3b42c5e4beeae11160b61149c0152b7a2c023eec 100644 --- a/transcoder_all/layer_58_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_58_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.58.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_58_width_262k_l0_small/config.json b/transcoder_all/layer_58_width_262k_l0_small/config.json index e63e84b3349a11addb0ab8765cf092409118d598..3cc023af00e7abd3b8975c3d4df852162ad7a571 100644 --- a/transcoder_all/layer_58_width_262k_l0_small/config.json +++ b/transcoder_all/layer_58_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.58.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_big_affine/config.json b/transcoder_all/layer_5_width_16k_l0_big_affine/config.json index c9189080613f6590ff9a0f8680c02e48ca2727ca..736e86026b2d4dad97dbd4478f37e337efc68efa 100644 --- a/transcoder_all/layer_5_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_5_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 74, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_big/config.json b/transcoder_all/layer_5_width_262k_l0_big/config.json index efb5ec786da69fbfbc67691b68f57763fd40cb29..c26a1d0be4ed5c750e2858521d1a9540146e1caa 100644 --- a/transcoder_all/layer_5_width_262k_l0_big/config.json +++ b/transcoder_all/layer_5_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 74, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_big_affine/config.json b/transcoder_all/layer_5_width_262k_l0_big_affine/config.json index 6128e569d3507d86b7b952c01bd304bf19e5cbb7..0d9f0666dcc8bfef8454966b7a0a1e78a20cb481 100644 --- a/transcoder_all/layer_5_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_5_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 74, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_small_affine/config.json b/transcoder_all/layer_5_width_262k_l0_small_affine/config.json index 3a578887ffcc15dab18a083748b4a65fc5520d9a..a8f00cc521195a00ee11b687b7078dd80d95f533 100644 --- a/transcoder_all/layer_5_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_5_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 12, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_60_width_16k_l0_big_affine/config.json b/transcoder_all/layer_60_width_16k_l0_big_affine/config.json index 91dfd95aef5ed8265fabc870d6baf7ca645eaca8..1687abed6803e1a57df7bed8cda26fb1c001c224 100644 --- a/transcoder_all/layer_60_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_60_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.60.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_60_width_16k_l0_small_affine/config.json b/transcoder_all/layer_60_width_16k_l0_small_affine/config.json index 3cbfb6012eb57e3b53ae3bb495b009ff6cc72581..5182581dbeb790ae79e3590f369a3f5ac962ee03 100644 --- a/transcoder_all/layer_60_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_60_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.60.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_small/config.json b/transcoder_all/layer_6_width_16k_l0_small/config.json index 0aee1ec9110224446f46fb2494f37c5a2f04c541..727262dfc61f2ae6a51caa0ddd2e289d0acfefd8 100644 --- a/transcoder_all/layer_6_width_16k_l0_small/config.json +++ b/transcoder_all/layer_6_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 12, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_big/config.json b/transcoder_all/layer_7_width_16k_l0_big/config.json index 056bab98c6f87fa00af9f8dc06b7b4f06129dc75..39a9481e8e79e7410291a492be49c3c8aefaaa9a 100644 --- a/transcoder_all/layer_7_width_16k_l0_big/config.json +++ b/transcoder_all/layer_7_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 80, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_big_affine/config.json b/transcoder_all/layer_7_width_16k_l0_big_affine/config.json index 4a60608574185ea1537c489c0538af4cf15f4a78..81a9cad0369ced6b5826957f6b8f3a351c2583c3 100644 --- a/transcoder_all/layer_7_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_7_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 80, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_small_affine/config.json b/transcoder_all/layer_7_width_262k_l0_small_affine/config.json index 30590ab32bfb631b6728adb0602c606501c4a330..8968dae9f965cdc3df27be80062f501be4edf49d 100644 --- a/transcoder_all/layer_7_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_7_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_small/config.json b/transcoder_all/layer_9_width_16k_l0_small/config.json index ac5fe117ef6b4df44c10ce02be2e6c846b677b41..fdcd1a1670af0ef905553edce5be8d2934602337 100644 --- a/transcoder_all/layer_9_width_16k_l0_small/config.json +++ b/transcoder_all/layer_9_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 14, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file