diff --git a/transcoder_all/layer_10_width_16k_l0_big_affine/config.json b/transcoder_all/layer_10_width_16k_l0_big_affine/config.json index 58723ee706d86b8b8dd6428b10bf2f87c317c91a..3db329e7ff04518a53965cdfa22c16eee8985b77 100644 --- a/transcoder_all/layer_10_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_10_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 89, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_big/config.json b/transcoder_all/layer_10_width_262k_l0_big/config.json index dd0850590d238af6cd232193e46a6986d6baa069..dc6c2b225d97bced65c55ba133eedd6fed74a1db 100644 --- a/transcoder_all/layer_10_width_262k_l0_big/config.json +++ b/transcoder_all/layer_10_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 89, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_big/config.json b/transcoder_all/layer_11_width_16k_l0_big/config.json index ac2382ba60f9d76cd96b75463ca43d4fcc15aee2..f00855413e65d8e0712afb55a5a1cfa111bc7e40 100644 --- a/transcoder_all/layer_11_width_16k_l0_big/config.json +++ b/transcoder_all/layer_11_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 91, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_big/config.json b/transcoder_all/layer_11_width_262k_l0_big/config.json index 56c236348ae5a100839b6fe3db2c432198f198cc..b9dfde78750116c6cf6a705941dbacb6a3897032 100644 --- a/transcoder_all/layer_11_width_262k_l0_big/config.json +++ b/transcoder_all/layer_11_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 91, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_small/config.json b/transcoder_all/layer_12_width_16k_l0_small/config.json index bdf7f1cab6c19fade8331ac2c882b9377cfb18f2..67ad0c3e0ae869780214882b10405318ef119fb7 100644 --- a/transcoder_all/layer_12_width_16k_l0_small/config.json +++ b/transcoder_all/layer_12_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_big_affine/config.json b/transcoder_all/layer_14_width_262k_l0_big_affine/config.json index 916bd3f5c65b075d011b9d2566c170647dddd43c..a0775e22c2a21e0cbf153b768e5b484d904cfcf5 100644 --- a/transcoder_all/layer_14_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_14_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 100, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_small_affine/config.json b/transcoder_all/layer_15_width_262k_l0_small_affine/config.json index b2f71c5f4c2b387299445abbf71be1e0ade5111c..8ac1244bb301859c1195dc5ab22d9c06027d8de0 100644 --- a/transcoder_all/layer_15_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_15_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 17, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_big/config.json b/transcoder_all/layer_16_width_16k_l0_big/config.json index 94496134ee3e217e79adc8a95ec3a4af8eb14474..39dfa714ce0e1433c530721f4ab30ab7850b0394 100644 --- a/transcoder_all/layer_16_width_16k_l0_big/config.json +++ b/transcoder_all/layer_16_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 106, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_big_affine/config.json b/transcoder_all/layer_17_width_16k_l0_big_affine/config.json index 1da103fb3baddb61645b48244ccfd5aa9e98a6cc..a66dc9a4fc30547505c237941c0e6992c6f8c67e 100644 --- a/transcoder_all/layer_17_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_17_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 109, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_small/config.json b/transcoder_all/layer_17_width_16k_l0_small/config.json index 53c6bf7086b832ab3811ebd923d891f28375ceb0..6a25ccbae02db0674059de719afab5b3ae1287fc 100644 --- a/transcoder_all/layer_17_width_16k_l0_small/config.json +++ b/transcoder_all/layer_17_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_16k_l0_big/config.json b/transcoder_all/layer_19_width_16k_l0_big/config.json index 0ed1d8a6d93ca4ae0a0091f65f2b91288dc4d705..610b68e0e68f20a3f0df6ff95e3e13830bbd4939 100644 --- a/transcoder_all/layer_19_width_16k_l0_big/config.json +++ b/transcoder_all/layer_19_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 115, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_big_affine/config.json b/transcoder_all/layer_19_width_262k_l0_big_affine/config.json index 5786af47b2597c769501a510873a404a5c4ffc83..687c6e02ed9ef4262defdbfaecefe9002ee5f99a 100644 --- a/transcoder_all/layer_19_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_19_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 115, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_big_affine/config.json b/transcoder_all/layer_1_width_262k_l0_big_affine/config.json index 982f60293ca1a5408033aee142e9fd6d3a631e5a..22b092129158f7b670e71e678297dafc66b7e97f 100644 --- a/transcoder_all/layer_1_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_1_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 62, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_big/config.json b/transcoder_all/layer_20_width_262k_l0_big/config.json index 434bb5321281e86d8e43db36e918f4bf5b265d1e..dda1607b87459e9b463392fd4a1c2f1d2f64a2f5 100644 --- a/transcoder_all/layer_20_width_262k_l0_big/config.json +++ b/transcoder_all/layer_20_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 118, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_21_width_262k_l0_big_affine/config.json b/transcoder_all/layer_21_width_262k_l0_big_affine/config.json index e04e9459eadcc65b763cb374483764a30409edf1..90eb93ee80d9d9aaf235adb6a0261dfba73d67f0 100644 --- a/transcoder_all/layer_21_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_21_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_16k_l0_big/config.json b/transcoder_all/layer_22_width_16k_l0_big/config.json index 444243bf2c31658befa282c3e9f6e0ebc9e2e97d..9907a91d089ad459a5a08f8d77b35a9a9ac6ed68 100644 --- a/transcoder_all/layer_22_width_16k_l0_big/config.json +++ b/transcoder_all/layer_22_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_big/config.json b/transcoder_all/layer_23_width_16k_l0_big/config.json index bfee078f2c6113e6a9a7195fc39f1de3fcf4e858..d106ae3052fc8bb6b2523c4739379e0973eeb44f 100644 --- a/transcoder_all/layer_23_width_16k_l0_big/config.json +++ b/transcoder_all/layer_23_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_small_affine/config.json b/transcoder_all/layer_23_width_16k_l0_small_affine/config.json index 52f2d6ba3ddd81833813592e716187e5d1bbc762..bda6bd0cafbaae9ad0a881fe3cfa189f5fd00a0a 100644 --- a/transcoder_all/layer_23_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_23_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_small/config.json b/transcoder_all/layer_24_width_262k_l0_small/config.json index a0135f25fbafea5c5d1770d28a611cba496e5403..d70140b7cacb82deaa0df385646b12dccaf2b825 100644 --- a/transcoder_all/layer_24_width_262k_l0_small/config.json +++ b/transcoder_all/layer_24_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_16k_l0_small/config.json b/transcoder_all/layer_26_width_16k_l0_small/config.json index 0fff2ae82cfd8d5734f623c228ba0e880a83d9ed..99204aefbedb430a150be49cc7447a475df6e7d1 100644 --- a/transcoder_all/layer_26_width_16k_l0_small/config.json +++ b/transcoder_all/layer_26_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_16k_l0_small/config.json b/transcoder_all/layer_27_width_16k_l0_small/config.json index 276df67d55ca4955df3f20d490a102c8a713d5d3..dc10878fa74cf4a9529db007093bc6d56727f02c 100644 --- a/transcoder_all/layer_27_width_16k_l0_small/config.json +++ b/transcoder_all/layer_27_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_16k_l0_small_affine/config.json b/transcoder_all/layer_27_width_16k_l0_small_affine/config.json index 6b23a79b9285aa7c2ca49e57948d32270fae0e14..51000fac5fe9455752bf2669f87e1cc2b777b278 100644 --- a/transcoder_all/layer_27_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_27_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_28_width_262k_l0_small/config.json b/transcoder_all/layer_28_width_262k_l0_small/config.json index d56e6a00e195bc300133d028c8b942766fdd5e88..ce988aafa4fdf1d1bace9694e3edbd63fe57c400 100644 --- a/transcoder_all/layer_28_width_262k_l0_small/config.json +++ b/transcoder_all/layer_28_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_262k_l0_big_affine/config.json b/transcoder_all/layer_29_width_262k_l0_big_affine/config.json index 80a099bcece0350371cfa3b1c35c11e9510cd4ab..4ac34f6e5d19e92061c9ec9f030c442b90cbbc87 100644 --- a/transcoder_all/layer_29_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_29_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_small/config.json b/transcoder_all/layer_2_width_16k_l0_small/config.json index ef063bf8cbf94a3ae5ec1da3eb6b42aa2ed4456b..0da3c9e1d32ee781b068bda62c8e6a48c9724e2a 100644 --- a/transcoder_all/layer_2_width_16k_l0_small/config.json +++ b/transcoder_all/layer_2_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_small_affine/config.json b/transcoder_all/layer_2_width_16k_l0_small_affine/config.json index 397da71e4d32fb5b75d72ee0c9c1f737e66ade89..adad932fe8396b5620ccefab63f03df8c1d13576 100644 --- a/transcoder_all/layer_2_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_2_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_big/config.json b/transcoder_all/layer_2_width_262k_l0_big/config.json index 3ffdaac4309d5d258b1cf6292595a5d24e391f5b..e2fcc751a1670afd0405c49aecb5e9b552a66ea4 100644 --- a/transcoder_all/layer_2_width_262k_l0_big/config.json +++ b/transcoder_all/layer_2_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 65, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_big_affine/config.json b/transcoder_all/layer_2_width_262k_l0_big_affine/config.json index 93d19e0ec23c55c62b611441fa73de1054f850e5..54f2b8f05c327dac9b571478e14559edae4f6ffd 100644 --- a/transcoder_all/layer_2_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_2_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 65, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_16k_l0_small_affine/config.json b/transcoder_all/layer_30_width_16k_l0_small_affine/config.json index cdba3b802f0e87833db19b0c99a9c249de4f9b0b..e6782621cdeb91f66e82f1f1fd2de229938d7933 100644 --- a/transcoder_all/layer_30_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_30_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_31_width_262k_l0_big_affine/config.json b/transcoder_all/layer_31_width_262k_l0_big_affine/config.json index 53fcdb0990310aa9f26cdeae77e323a402a97136..9585874f90bbda95cebec16d861ac3bceb09f0ea 100644 --- a/transcoder_all/layer_31_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_31_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.31.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_32_width_16k_l0_small/config.json b/transcoder_all/layer_32_width_16k_l0_small/config.json index e4a4c3d8d48ebaee70dd13b4603a88161c4b3fb5..e1295c699ca2982b96cb8bc631bd7e5ca9369e5e 100644 --- a/transcoder_all/layer_32_width_16k_l0_small/config.json +++ b/transcoder_all/layer_32_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_16k_l0_small_affine/config.json b/transcoder_all/layer_33_width_16k_l0_small_affine/config.json index bc13bd88a3385a25f156b0b10f6f71615963eff3..6cc03bd2eebe5b8e9791773da85734684fa53fd5 100644 --- a/transcoder_all/layer_33_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_33_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_16k_l0_big_affine/config.json b/transcoder_all/layer_34_width_16k_l0_big_affine/config.json index ea82e912604cc60f7aaf64fd472752106b45bcbb..427af736662363a5dbb102f10c0c70ab28823de2 100644 --- a/transcoder_all/layer_34_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_34_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_16k_l0_small_affine/config.json b/transcoder_all/layer_34_width_16k_l0_small_affine/config.json index 9e2725423a5ec2ab07e72f7265e6b56b4af82020..4be9662a4a5a64f7fd8789491076ec0c3839993b 100644 --- a/transcoder_all/layer_34_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_34_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_36_width_262k_l0_big/config.json b/transcoder_all/layer_36_width_262k_l0_big/config.json index 5306ceed5df0d9970834dbeafedc76dd37027943..2548ba833ada7574911ad9d4320fe1cabe46cb32 100644 --- a/transcoder_all/layer_36_width_262k_l0_big/config.json +++ b/transcoder_all/layer_36_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.36.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_262k_l0_small_affine/config.json b/transcoder_all/layer_37_width_262k_l0_small_affine/config.json index a5218a7ec75a9d1667d3711f7d7ea915d460196f..d1ac4f0eff5539fe5e26f1ff899f28bc8e9acdbe 100644 --- a/transcoder_all/layer_37_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_37_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_16k_l0_small/config.json b/transcoder_all/layer_38_width_16k_l0_small/config.json index 58be2fd7e4bb4f864736f49538397923f2464225..83de3d93d88a81852fe93113fb18a47b0e6d3159 100644 --- a/transcoder_all/layer_38_width_16k_l0_small/config.json +++ b/transcoder_all/layer_38_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_262k_l0_small_affine/config.json b/transcoder_all/layer_38_width_262k_l0_small_affine/config.json index 5e9a370906524ac9a56dfb0f65ed68c8419eaa1f..3ac06d868d1d656127c11a17c243897ca6d6df5d 100644 --- a/transcoder_all/layer_38_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_38_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_16k_l0_big/config.json b/transcoder_all/layer_39_width_16k_l0_big/config.json index e519ce64e8514236d6655c9dfa9bdaf0598e4af5..d54cc72a12d8c49abc2893cae236dad87cc95f88 100644 --- a/transcoder_all/layer_39_width_16k_l0_big/config.json +++ b/transcoder_all/layer_39_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_small_affine/config.json b/transcoder_all/layer_3_width_16k_l0_small_affine/config.json index b36d28af7d44c4858cce30877b2e33bf23e047ce..10d43e9bf026b90140ecb43622e4c8630b541333 100644 --- a/transcoder_all/layer_3_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_3_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_big/config.json b/transcoder_all/layer_3_width_262k_l0_big/config.json index d1e109e01246bd34b0fdd27de9f58c35d091ecfa..8a7300035fbf16c968e014dd30dad087627f9090 100644 --- a/transcoder_all/layer_3_width_262k_l0_big/config.json +++ b/transcoder_all/layer_3_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 68, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_40_width_16k_l0_big_affine/config.json b/transcoder_all/layer_40_width_16k_l0_big_affine/config.json index 6470615974e3f13d662b124c543ff42764964a55..24d3d7aeeddd541de7f7b18de06a222a807adc72 100644 --- a/transcoder_all/layer_40_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_40_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.40.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_41_width_16k_l0_small_affine/config.json b/transcoder_all/layer_41_width_16k_l0_small_affine/config.json index aa3c3eadd3146fb2f577641dd96b248f297f1652..59eafbb97e744dfbf706d547586a15c43a6ffccf 100644 --- a/transcoder_all/layer_41_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_41_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.41.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_41_width_262k_l0_small_affine/config.json b/transcoder_all/layer_41_width_262k_l0_small_affine/config.json index c7d4b59e131aff92bee9863aafc1d1bd2e3205ac..195c3ce370549a7eb0de6a27e8b3d5b2a1ccfcda 100644 --- a/transcoder_all/layer_41_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_41_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.41.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_42_width_16k_l0_big_affine/config.json b/transcoder_all/layer_42_width_16k_l0_big_affine/config.json index 69fd92b3c703bfafa7bb51df2b9ae4c56b9e3672..7dcb290a4b4e7141870ddf9144b56023d79f3cb2 100644 --- a/transcoder_all/layer_42_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_42_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.42.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_43_width_16k_l0_big_affine/config.json b/transcoder_all/layer_43_width_16k_l0_big_affine/config.json index 0890baef15ebc4fc0083512e3cb08013f17081b0..643e62c9145657fe6cdbef8e2034f3a5a163e9bc 100644 --- a/transcoder_all/layer_43_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_43_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_43_width_16k_l0_small_affine/config.json b/transcoder_all/layer_43_width_16k_l0_small_affine/config.json index 0734de7486d2ee12b46c6b0e6d9ce3d9c268b512..8bedd47cccb21b28e32286adbcff3e245e05c738 100644 --- a/transcoder_all/layer_43_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_43_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_43_width_262k_l0_big_affine/config.json b/transcoder_all/layer_43_width_262k_l0_big_affine/config.json index bb4ad8ef781ffef5aa849356e197fdec9d94bfcd..b15083ccd4ddcacaf0a8f5edb5a47c6fffd6d561 100644 --- a/transcoder_all/layer_43_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_43_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_44_width_16k_l0_big_affine/config.json b/transcoder_all/layer_44_width_16k_l0_big_affine/config.json index 3498ac3b8e9c6f38914fa3218c57434ec684d134..82d92a8585cc3f962a44bc3f96f7312e2a63b314 100644 --- a/transcoder_all/layer_44_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_44_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.44.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_45_width_16k_l0_small/config.json b/transcoder_all/layer_45_width_16k_l0_small/config.json index 214dd17d1ad24a06ad94909a79e5a27e34db0e7f..0237aaf77fa4a7a1e313666384745afe61b53cef 100644 --- a/transcoder_all/layer_45_width_16k_l0_small/config.json +++ b/transcoder_all/layer_45_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.45.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_48_width_16k_l0_small_affine/config.json b/transcoder_all/layer_48_width_16k_l0_small_affine/config.json index 9a4a8d9ac7f23714d7a65bfee973e81ee5f2e0ff..f62d408653547bd795024a595b681033e2f7cd5f 100644 --- a/transcoder_all/layer_48_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_48_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.48.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.48.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_16k_l0_small/config.json b/transcoder_all/layer_49_width_16k_l0_small/config.json index b951d34d0f9009728f778062296423af2f372a4e..4a27ae7f0701d3bce67a100dabbb64bf477632e1 100644 --- a/transcoder_all/layer_49_width_16k_l0_small/config.json +++ b/transcoder_all/layer_49_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_16k_l0_small_affine/config.json b/transcoder_all/layer_49_width_16k_l0_small_affine/config.json index 3c24bcda9edda95b48be34bedbf8ccbb97a672b3..249e9615ea331ccf999a0cdef2d5020724a49b8c 100644 --- a/transcoder_all/layer_49_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_49_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_262k_l0_small_affine/config.json b/transcoder_all/layer_49_width_262k_l0_small_affine/config.json index 1faf60caf5ca7e1319de38e0fe84a6140bba7be7..eb43f306fa663f9ff6fcac7632ccd62098eb84b2 100644 --- a/transcoder_all/layer_49_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_49_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_big_affine/config.json b/transcoder_all/layer_4_width_16k_l0_big_affine/config.json index 677173c6f97233efe115220c54af6a792fa4087c..6136c341c84f7bd078595da62192a392f874ce50 100644 --- a/transcoder_all/layer_4_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_4_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 71, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_big_affine/config.json b/transcoder_all/layer_4_width_262k_l0_big_affine/config.json index c335d0edbee8a4be67f742ca06075aa123537df3..7e5a0da30c018ddbd7ead038a522efc473abefcc 100644 --- a/transcoder_all/layer_4_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_4_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 71, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_262k_l0_small/config.json b/transcoder_all/layer_50_width_262k_l0_small/config.json index bacf1db4c17a50a6206ff2b8470a60df9823c093..6b4cfa6d86af24aa57ac35e6d7eb05bf9d730309 100644 --- a/transcoder_all/layer_50_width_262k_l0_small/config.json +++ b/transcoder_all/layer_50_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_16k_l0_big/config.json b/transcoder_all/layer_52_width_16k_l0_big/config.json index 0f42e400b482feb91002bd6943772f57d3c4f1f9..a868c122d49b6cbcc7e112769398b5210af08a78 100644 --- a/transcoder_all/layer_52_width_16k_l0_big/config.json +++ b/transcoder_all/layer_52_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_53_width_16k_l0_small_affine/config.json b/transcoder_all/layer_53_width_16k_l0_small_affine/config.json index 2b7f6719362f02c3d29d951e7bf9a92250a6025a..e88b8c55ec20a8bb42928ca5c3ae8810f661b39a 100644 --- a/transcoder_all/layer_53_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_53_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.53.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.53.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_54_width_262k_l0_small/config.json b/transcoder_all/layer_54_width_262k_l0_small/config.json index 3e753d5cd211ea1ce71cecaf690019c801e0fb33..86a3bd94d9b400021af704dedad0ab5db71073de 100644 --- a/transcoder_all/layer_54_width_262k_l0_small/config.json +++ b/transcoder_all/layer_54_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.54.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_16k_l0_big/config.json b/transcoder_all/layer_55_width_16k_l0_big/config.json index b711b893d6f18e161221db3da97f8cf1b01fe3a6..1772d82288fbf9a4604af801d030738a1762fa4e 100644 --- a/transcoder_all/layer_55_width_16k_l0_big/config.json +++ b/transcoder_all/layer_55_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_16k_l0_big/config.json b/transcoder_all/layer_56_width_16k_l0_big/config.json index 16ea83d685d85b4e6feeab2d2d3031c941874fcb..5dfa6b050887acda8d2fa0a25187fb7994009175 100644 --- a/transcoder_all/layer_56_width_16k_l0_big/config.json +++ b/transcoder_all/layer_56_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_16k_l0_big_affine/config.json b/transcoder_all/layer_56_width_16k_l0_big_affine/config.json index adbf601bb53270196f31545b64a92e70677040b7..b06abd23e095c42923bf29d6ced04400a838365b 100644 --- a/transcoder_all/layer_56_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_56_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_16k_l0_big/config.json b/transcoder_all/layer_57_width_16k_l0_big/config.json index 737bf181adeabf2df072f9493a7b0ac066d8af7b..47bf5c2165da5ae6ce1166bbeb4b104d4d80734e 100644 --- a/transcoder_all/layer_57_width_16k_l0_big/config.json +++ b/transcoder_all/layer_57_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_59_width_262k_l0_big/config.json b/transcoder_all/layer_59_width_262k_l0_big/config.json index cd3a3d8d92d6d024c9407b1e1e58647459e66e04..fee8ab31cc530a3aa553f26fdc5f108d956b719a 100644 --- a/transcoder_all/layer_59_width_262k_l0_big/config.json +++ b/transcoder_all/layer_59_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.59.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.59.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_59_width_262k_l0_small/config.json b/transcoder_all/layer_59_width_262k_l0_small/config.json index 335c67b76436495e5869649bd4684602fa1a91ea..f574bacf93273a3efe671f154fef7f5ae8b7b78f 100644 --- a/transcoder_all/layer_59_width_262k_l0_small/config.json +++ b/transcoder_all/layer_59_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.59.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.59.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_60_width_262k_l0_small_affine/config.json b/transcoder_all/layer_60_width_262k_l0_small_affine/config.json index 1bf83a1f97170becdbc26845ad88991d148bec9c..0fff7046765c6db48e8f7706edca55669a5e8b77 100644 --- a/transcoder_all/layer_60_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_60_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.60.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_61_width_16k_l0_big_affine/config.json b/transcoder_all/layer_61_width_16k_l0_big_affine/config.json index dcd188f9a33f3f052daa9a406b423bf4b1af1318..11e818b6bdebce3fed133fc793021b0a94c43dd8 100644 --- a/transcoder_all/layer_61_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_61_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.61.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_61_width_16k_l0_small_affine/config.json b/transcoder_all/layer_61_width_16k_l0_small_affine/config.json index af66824be9c0b091ce089d3eb791351705956a8c..6e7e1b9eea9d964a3f3e9a3c18a1de828140b16c 100644 --- a/transcoder_all/layer_61_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_61_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.61.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_61_width_262k_l0_small/config.json b/transcoder_all/layer_61_width_262k_l0_small/config.json index 9e0d9f3202b3e2ad43f6e4476b7e31512e5cdc45..e4d95448b43aeb70fafd8edd20395dd48b282534 100644 --- a/transcoder_all/layer_61_width_262k_l0_small/config.json +++ b/transcoder_all/layer_61_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.61.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_big_affine/config.json b/transcoder_all/layer_6_width_262k_l0_big_affine/config.json index 20fc34a8417e56ed3825e5702ac605027049557d..de1f41557aa6c7cf84cb53b3be81b7eee7b25287 100644 --- a/transcoder_all/layer_6_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_6_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 77, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_small/config.json b/transcoder_all/layer_6_width_262k_l0_small/config.json index 4e568da7be0381f68c6fac54ba103045989b3d8c..b4b263e1727cb1f5728deb94b041bae7edf0a8e6 100644 --- a/transcoder_all/layer_6_width_262k_l0_small/config.json +++ b/transcoder_all/layer_6_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 12, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_small_affine/config.json b/transcoder_all/layer_7_width_16k_l0_small_affine/config.json index 2c19a18ef73535ca80b2bc6488de26908b1cf66c..0e4ef3ef3ae63f5782cab96bed72740b1869b02d 100644 --- a/transcoder_all/layer_7_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_7_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_big/config.json b/transcoder_all/layer_7_width_262k_l0_big/config.json index 4c1b9ad576f4c3e7f704a44243f8f798e685b72e..88d5e5a2722148e863710db2e1baf2e8ded9fa02 100644 --- a/transcoder_all/layer_7_width_262k_l0_big/config.json +++ b/transcoder_all/layer_7_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 80, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_big_affine/config.json b/transcoder_all/layer_8_width_16k_l0_big_affine/config.json index 739503f20591d47d54ccbd0c994372c740094d47..c193dd773bc25d24a87f813d24310aed2c031b3b 100644 --- a/transcoder_all/layer_8_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_8_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 83, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_big_affine/config.json b/transcoder_all/layer_8_width_262k_l0_big_affine/config.json index 0bd69b9ada3e6d3436300f67b6a58df16f26da9a..f53ca933b969de98e78a1d5e3bc207300b2338d7 100644 --- a/transcoder_all/layer_8_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_8_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 83, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_big_affine/config.json b/transcoder_all/layer_9_width_16k_l0_big_affine/config.json index d13737a478b0ddf21a24903870831dbc077b3cfc..fe44a5f271557b7294830b2b701e1aeb60ae66b8 100644 --- a/transcoder_all/layer_9_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_9_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 86, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file