diff --git a/transcoder_all/layer_0_width_16k_l0_big/config.json b/transcoder_all/layer_0_width_16k_l0_big/config.json index 8a7258f6ffc7cdfff4635989c4d8a511d648dc3c..cc09037bd9fe4d3d3f871e35a634be06fbab9616 100644 --- a/transcoder_all/layer_0_width_16k_l0_big/config.json +++ b/transcoder_all/layer_0_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_big/config.json b/transcoder_all/layer_10_width_16k_l0_big/config.json index 8b17626b8044ecbed0d55703806a1632b3f85b2b..1ea32488fb254d5bd85037d11677f8b5da9b1735 100644 --- a/transcoder_all/layer_10_width_16k_l0_big/config.json +++ b/transcoder_all/layer_10_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 89, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_small/config.json b/transcoder_all/layer_10_width_16k_l0_small/config.json index e3694b67570c1580d74adbb11c1374d440768713..c86f050f5ac5b25cd308742e7c6e4d39802c3469 100644 --- a/transcoder_all/layer_10_width_16k_l0_small/config.json +++ b/transcoder_all/layer_10_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 14, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_small/config.json b/transcoder_all/layer_10_width_262k_l0_small/config.json index 988d5b85b186215a23a4f858fb0384abef3158fa..a30dfc992541d157e73b9387a252b8efd4ee16f6 100644 --- a/transcoder_all/layer_10_width_262k_l0_small/config.json +++ b/transcoder_all/layer_10_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 14, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_small/config.json b/transcoder_all/layer_11_width_16k_l0_small/config.json index 8bf9ab0af2866d5948c53be36cf3483f1ea10c4c..1fa69bc7850d75cc30760ab578e10d4432f14071 100644 --- a/transcoder_all/layer_11_width_16k_l0_small/config.json +++ b/transcoder_all/layer_11_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_small_affine/config.json b/transcoder_all/layer_11_width_16k_l0_small_affine/config.json index 1bdcbc28d56df4bfbc782fb41b0d333917ccfb0c..04a8d28d0ac60cec5747a870382adf8348b9be07 100644 --- a/transcoder_all/layer_11_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_11_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_small/config.json b/transcoder_all/layer_11_width_262k_l0_small/config.json index 60767c0220be630cfc40e1ce0decd58d95e6e4d0..5773b225c1182dcb2d1dab359da1831e9384f928 100644 --- a/transcoder_all/layer_11_width_262k_l0_small/config.json +++ b/transcoder_all/layer_11_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_big_affine/config.json b/transcoder_all/layer_12_width_262k_l0_big_affine/config.json index 0d6d058e0d76d2bb97aa27ce411451446ea176cf..aff90030c350ca15fd7d634a44f6285d66d0b320 100644 --- a/transcoder_all/layer_12_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_12_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 94, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_small/config.json b/transcoder_all/layer_12_width_262k_l0_small/config.json index cc0a31dcd58e0d513d0db7b26a9e20ee30a37d46..51de77f428e4148c6d4831afad997c5b5aefaa7d 100644 --- a/transcoder_all/layer_12_width_262k_l0_small/config.json +++ b/transcoder_all/layer_12_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_262k_l0_small_affine/config.json b/transcoder_all/layer_12_width_262k_l0_small_affine/config.json index 5f7563a06524f3314bc869265b4b9856b5567f9b..c7cf8b1e5809fc2925b83a340e09fecf61324c38 100644 --- a/transcoder_all/layer_12_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_12_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_small/config.json b/transcoder_all/layer_13_width_16k_l0_small/config.json index f9af946baa99f3e2a7f04d57a9a200140fbbb622..f58307d141defaac292684895785e52ad380ef97 100644 --- a/transcoder_all/layer_13_width_16k_l0_small/config.json +++ b/transcoder_all/layer_13_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_big_affine/config.json b/transcoder_all/layer_13_width_262k_l0_big_affine/config.json index 91e00c743cd081c76ce47929b5ebe95020497e40..a68695012cdaaea6add354f63c6eacdc2a373265 100644 --- a/transcoder_all/layer_13_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_13_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 97, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_big_affine/config.json b/transcoder_all/layer_14_width_16k_l0_big_affine/config.json index 6e29bd629af6ff1b83692b8c76e446b39d195ee0..1dc06fd97512fb37158935e8111e37c303d6d619 100644 --- a/transcoder_all/layer_14_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_14_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 100, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_big_affine/config.json b/transcoder_all/layer_15_width_16k_l0_big_affine/config.json index 1d973c4068ec03725558e10422feb3f09a6db8e5..fd4a8d0ebfeeabbc6c68052d2a68afd0da733dda 100644 --- a/transcoder_all/layer_15_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_15_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 103, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_small/config.json b/transcoder_all/layer_15_width_16k_l0_small/config.json index 8df8d92273715c0baea7759b931e00112809b572..2d43494d7f465d2eea4aea77516e5a709bd5dc69 100644 --- a/transcoder_all/layer_15_width_16k_l0_small/config.json +++ b/transcoder_all/layer_15_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 17, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_small_affine/config.json b/transcoder_all/layer_15_width_16k_l0_small_affine/config.json index bd67834674c4d0105d7ed01a0a0a376bb98a1e92..ef7abf7b5571e52405ac55cae8c3c25fde1c3323 100644 --- a/transcoder_all/layer_15_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_15_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 17, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_big_affine/config.json b/transcoder_all/layer_15_width_262k_l0_big_affine/config.json index 69c8d119758744d9867216656cef46ad1d67bf24..2f342bd8e74c464fe1036037decf72e756640748 100644 --- a/transcoder_all/layer_15_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_15_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 103, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_16k_l0_big_affine/config.json b/transcoder_all/layer_16_width_16k_l0_big_affine/config.json index c160b37454550567e852eb82aa0eb3ba94ed3bbd..947e535d5b42d31cc3d321eb8737621dc505b763 100644 --- a/transcoder_all/layer_16_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_16_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 106, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_big_affine/config.json b/transcoder_all/layer_16_width_262k_l0_big_affine/config.json index 9c87078e5e1c241cd1c75e98e268bcf96667c1f1..b2c3cc671303291164b8ab5f8f0e838f1362f4f5 100644 --- a/transcoder_all/layer_16_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_16_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 106, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_small/config.json b/transcoder_all/layer_16_width_262k_l0_small/config.json index f7edb3d7031d0ccac7681bdcfe5a19fa5a30cc72..1fb5de04dfdd60095b30a63caa76cea25681daec 100644 --- a/transcoder_all/layer_16_width_262k_l0_small/config.json +++ b/transcoder_all/layer_16_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 17, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_big/config.json b/transcoder_all/layer_17_width_262k_l0_big/config.json index 1f42a8f8238accae1fe89e01416176afb92e4f27..1a9c3f082f616fe7290507d7529f6801875f1fc9 100644 --- a/transcoder_all/layer_17_width_262k_l0_big/config.json +++ b/transcoder_all/layer_17_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 109, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small/config.json b/transcoder_all/layer_17_width_262k_l0_small/config.json index 139f9197c7055db7c064775b134d38547d6beb59..62f0ae10764f6c01ddd0392790221ace30db9a18 100644 --- a/transcoder_all/layer_17_width_262k_l0_small/config.json +++ b/transcoder_all/layer_17_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_big_affine/config.json b/transcoder_all/layer_18_width_262k_l0_big_affine/config.json index 4dbb58dae5fcdacea63ada40d569846c21ce0a8f..0c2e4d3f36000619472a99e810866d517fe02366 100644 --- a/transcoder_all/layer_18_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_18_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 112, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_small/config.json b/transcoder_all/layer_18_width_262k_l0_small/config.json index 4e8481ea6dcbb37c63984fc3f81e8c56fe9f511a..c5e97e590b474edcac3d6a1a554c4e69ea50c4ad 100644 --- a/transcoder_all/layer_18_width_262k_l0_small/config.json +++ b/transcoder_all/layer_18_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_18_width_262k_l0_small_affine/config.json b/transcoder_all/layer_18_width_262k_l0_small_affine/config.json index 6901a42b4045bdf154377ed39301d0f0754e6c0e..4b4d1b6c8845d273ca6f01aad2c4b18d27b04ad7 100644 --- a/transcoder_all/layer_18_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_18_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.18.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_19_width_262k_l0_small/config.json b/transcoder_all/layer_19_width_262k_l0_small/config.json index 3b66a7175c760914e72be5ae23a4c32d91c6e2aa..5b762e338c8306c7fc5b20ed77ae67d1eaa639db 100644 --- a/transcoder_all/layer_19_width_262k_l0_small/config.json +++ b/transcoder_all/layer_19_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.19.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 19, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_16k_l0_small_affine/config.json b/transcoder_all/layer_1_width_16k_l0_small_affine/config.json index c1502e4863d1884f947f9d61b1ba6b28c9053206..46acdc0c8473c59fecff07331aef2692e5a124bd 100644 --- a/transcoder_all/layer_1_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_1_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_big_affine/config.json b/transcoder_all/layer_20_width_262k_l0_big_affine/config.json index ecd51895504df3afa7ee9c3aeaf7d5fd898996e4..76f9445a446c5c824a5224c4c5e67846aa37a97c 100644 --- a/transcoder_all/layer_20_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_20_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 118, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_20_width_262k_l0_small/config.json b/transcoder_all/layer_20_width_262k_l0_small/config.json index 75fb52123ab4d13bbcb346b0c5c99367f293c3f1..546cc1a9066df8789c42f9e9861532c48440196a 100644 --- a/transcoder_all/layer_20_width_262k_l0_small/config.json +++ b/transcoder_all/layer_20_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.20.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.20.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 19, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_21_width_16k_l0_small/config.json b/transcoder_all/layer_21_width_16k_l0_small/config.json index 7a3bde7b96b348b9feb1774cdca67a4269b1ec2c..4c7b1b4a000d66ceb3d8c570ac7c9d0c589a4089 100644 --- a/transcoder_all/layer_21_width_16k_l0_small/config.json +++ b/transcoder_all/layer_21_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.21.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_22_width_262k_l0_small/config.json b/transcoder_all/layer_22_width_262k_l0_small/config.json index 88bfe0984683fedb25dca6d9c60c9d0f75fa3060..3198d45850bb7c1f775598617c2e784ec6862a80 100644 --- a/transcoder_all/layer_22_width_262k_l0_small/config.json +++ b/transcoder_all/layer_22_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.22.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_16k_l0_big_affine/config.json b/transcoder_all/layer_23_width_16k_l0_big_affine/config.json index c6f6c9b664c78e0caadee249c243dadc421203e3..f937f997a985598ee44935e8fcbdc4f9c98d368a 100644 --- a/transcoder_all/layer_23_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_23_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_23_width_262k_l0_big_affine/config.json b/transcoder_all/layer_23_width_262k_l0_big_affine/config.json index 172be675b952f0396cc74866c5850bdec885d7b6..8a6843c2c0db367ed3f069c78a54bdcc22b766b8 100644 --- a/transcoder_all/layer_23_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_23_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.23.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_24_width_262k_l0_big_affine/config.json b/transcoder_all/layer_24_width_262k_l0_big_affine/config.json index dc6f5433a967b6fca1ce85c389f752ae6980d829..6eba55f09c345d330808c4590db153e096be8569 100644 --- a/transcoder_all/layer_24_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_24_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.24.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_25_width_262k_l0_small_affine/config.json b/transcoder_all/layer_25_width_262k_l0_small_affine/config.json index 5b32f51a81932c202ef9b64b3c556a206077d251..d84db589568cd3e614f6fd1b7458f5579be44497 100644 --- a/transcoder_all/layer_25_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_25_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.25.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_26_width_16k_l0_big_affine/config.json b/transcoder_all/layer_26_width_16k_l0_big_affine/config.json index e49381c1605af6092613d4908af5eaa90c1f58fc..80e64ed6f62fb828e848f8b2037af2e495404713 100644 --- a/transcoder_all/layer_26_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_26_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.26.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_262k_l0_big/config.json b/transcoder_all/layer_27_width_262k_l0_big/config.json index 4e4d28f051594a8a25ebfcd8ed56ea9f18a84e0d..db5dcdcbff29dfd804d73f254905a125209062db 100644 --- a/transcoder_all/layer_27_width_262k_l0_big/config.json +++ b/transcoder_all/layer_27_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_262k_l0_big_affine/config.json b/transcoder_all/layer_27_width_262k_l0_big_affine/config.json index c1f4894e88feb32f05c561d847758012a89b89aa..e8cbb1d8b5d95a16fc1c0b69be31ea5327f9b092 100644 --- a/transcoder_all/layer_27_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_27_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_27_width_262k_l0_small_affine/config.json b/transcoder_all/layer_27_width_262k_l0_small_affine/config.json index aeaf16c85832a3884d8b14d898fc78895752fe93..1386cbf9880a76a4047c92606d15f41af2811b3d 100644 --- a/transcoder_all/layer_27_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_27_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.27.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_28_width_16k_l0_small/config.json b/transcoder_all/layer_28_width_16k_l0_small/config.json index fda9ca35e10ad912ac972ac036fe2a1029947926..38c2a2516d11f4a67be373e4aa14b871b308b651 100644 --- a/transcoder_all/layer_28_width_16k_l0_small/config.json +++ b/transcoder_all/layer_28_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.28.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_16k_l0_big/config.json b/transcoder_all/layer_29_width_16k_l0_big/config.json index dd50ce55f31f6b3054e75aaad8a062a554198a75..deeb7f48fdd403fc2d1d9d6110d98d334aaaee62 100644 --- a/transcoder_all/layer_29_width_16k_l0_big/config.json +++ b/transcoder_all/layer_29_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_262k_l0_big/config.json b/transcoder_all/layer_29_width_262k_l0_big/config.json index 52c1984074d0744ade5c59ead5810ab4152d3d0a..1ea116a0a8ecde25334c31c819320d11b0daa9ec 100644 --- a/transcoder_all/layer_29_width_262k_l0_big/config.json +++ b/transcoder_all/layer_29_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_29_width_262k_l0_small/config.json b/transcoder_all/layer_29_width_262k_l0_small/config.json index 9a9869d6145259ef6caa17da14f8fd11faa8b6bd..586a63f8775db728bcc52913910ec85731e91bf4 100644 --- a/transcoder_all/layer_29_width_262k_l0_small/config.json +++ b/transcoder_all/layer_29_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.29.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_big_affine/config.json b/transcoder_all/layer_2_width_16k_l0_big_affine/config.json index 51367afc64759f4d4ed84da87b9b406d24000b5e..997a00ba2a473c225839771b762cb2f9189de012 100644 --- a/transcoder_all/layer_2_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_2_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 65, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_30_width_16k_l0_big/config.json b/transcoder_all/layer_30_width_16k_l0_big/config.json index 45570fb89df06581c37f79c796ff1fe83beaf8ff..f59749222ff467c8c504990a0ea44ffe9573d5a9 100644 --- a/transcoder_all/layer_30_width_16k_l0_big/config.json +++ b/transcoder_all/layer_30_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.30.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_32_width_262k_l0_small/config.json b/transcoder_all/layer_32_width_262k_l0_small/config.json index e01ff3af3883797d820566e7c0691432c99bfd96..fea0ae78455fb381598de53b29c30374f7f1d7fe 100644 --- a/transcoder_all/layer_32_width_262k_l0_small/config.json +++ b/transcoder_all/layer_32_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.32.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_262k_l0_small/config.json b/transcoder_all/layer_33_width_262k_l0_small/config.json index 1009d7b69ae3f8a17a0093e9513b500f33ef18cc..ddcd11c486f0612ec0b2e98a2dd703b10a35b2b1 100644 --- a/transcoder_all/layer_33_width_262k_l0_small/config.json +++ b/transcoder_all/layer_33_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_33_width_262k_l0_small_affine/config.json b/transcoder_all/layer_33_width_262k_l0_small_affine/config.json index 5a4d27ea3c062ed0d1bbef646804ac1d585b4163..93e7b4eb64f5714749306148f38d1ae0e15930ce 100644 --- a/transcoder_all/layer_33_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_33_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.33.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_34_width_262k_l0_small/config.json b/transcoder_all/layer_34_width_262k_l0_small/config.json index 8d6adab8db856c8ecff5ac7788c21af807346c91..53087a899ea126da9ce56df40b63fe663b885719 100644 --- a/transcoder_all/layer_34_width_262k_l0_small/config.json +++ b/transcoder_all/layer_34_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.34.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_16k_l0_big/config.json b/transcoder_all/layer_35_width_16k_l0_big/config.json index d517e0392f803692688cb2927171146601b9a8d9..657e0023a45038c9dc12951ef7094222f78e960b 100644 --- a/transcoder_all/layer_35_width_16k_l0_big/config.json +++ b/transcoder_all/layer_35_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_35_width_262k_l0_big/config.json b/transcoder_all/layer_35_width_262k_l0_big/config.json index cf058fdb8cbecd22dca075d788b9d9679ce36f9d..2077ae7a1e71a582b43bc7d7cb5b266cfa694839 100644 --- a/transcoder_all/layer_35_width_262k_l0_big/config.json +++ b/transcoder_all/layer_35_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.35.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_36_width_16k_l0_small/config.json b/transcoder_all/layer_36_width_16k_l0_small/config.json index 41ff8a83471071612dc1c70cf2a3263233e4c044..6b11b987448ce583c4e7efe64fbb7c5f155eb770 100644 --- a/transcoder_all/layer_36_width_16k_l0_small/config.json +++ b/transcoder_all/layer_36_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.36.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_16k_l0_small/config.json b/transcoder_all/layer_37_width_16k_l0_small/config.json index ae7f70d8f369134246935e9d269ff34a3f8d5236..6a0812c696a667e041de0db2b850f6330dbceb71 100644 --- a/transcoder_all/layer_37_width_16k_l0_small/config.json +++ b/transcoder_all/layer_37_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_16k_l0_small_affine/config.json b/transcoder_all/layer_37_width_16k_l0_small_affine/config.json index 76d5070ad731aa5007a88fd7ed020f46b5937761..553e0bdf43ab4e036594f2125f3f7129b3873c54 100644 --- a/transcoder_all/layer_37_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_37_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_37_width_262k_l0_big_affine/config.json b/transcoder_all/layer_37_width_262k_l0_big_affine/config.json index 3c180d759cec0680e024994a6374a63c0e32f91d..8a76677a458e348c8657e92b8543763660d9522c 100644 --- a/transcoder_all/layer_37_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_37_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.37.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_16k_l0_big/config.json b/transcoder_all/layer_38_width_16k_l0_big/config.json index 327fe7456b9b162ea0b9eb7edd2725f4ff7bfa2e..bbbf7ee92aa57dc886d0b48320d05881fa9c7ad4 100644 --- a/transcoder_all/layer_38_width_16k_l0_big/config.json +++ b/transcoder_all/layer_38_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_38_width_262k_l0_big/config.json b/transcoder_all/layer_38_width_262k_l0_big/config.json index 72e465b6edbfe4dc84090a3a36f036cf83f3a6ce..bc0f6db131619d1215e0546420357b2b3af25e28 100644 --- a/transcoder_all/layer_38_width_262k_l0_big/config.json +++ b/transcoder_all/layer_38_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.38.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_39_width_16k_l0_big_affine/config.json b/transcoder_all/layer_39_width_16k_l0_big_affine/config.json index 51401013e2589ced3ac55f4536fa691605b6336c..97a209062cc0ce4fcf0ea4f940b8a0ddc8cd21c9 100644 --- a/transcoder_all/layer_39_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_39_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.39.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_40_width_16k_l0_big/config.json b/transcoder_all/layer_40_width_16k_l0_big/config.json index 9e783c885ac2f78ecc0eb0b66239156c7558ae82..3242b7f82a3e8dcdc2bc9e158386a1bfb0e9b6f9 100644 --- a/transcoder_all/layer_40_width_16k_l0_big/config.json +++ b/transcoder_all/layer_40_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.40.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_40_width_262k_l0_small/config.json b/transcoder_all/layer_40_width_262k_l0_small/config.json index e86fd6556fc5f87e8e3ee450255a130b31cb7f27..7c53e93d3b876f929998c2422ef0736a1514d7f5 100644 --- a/transcoder_all/layer_40_width_262k_l0_small/config.json +++ b/transcoder_all/layer_40_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.40.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_40_width_262k_l0_small_affine/config.json b/transcoder_all/layer_40_width_262k_l0_small_affine/config.json index e78e43c6b9fbd853e7ee691b5537b4304f3dea13..acd8f3c59fdbd313e2f4851ad1bda3c8fef2ca8b 100644 --- a/transcoder_all/layer_40_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_40_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.40.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_41_width_16k_l0_big/config.json b/transcoder_all/layer_41_width_16k_l0_big/config.json index 591e2cb6d8e168d4af1680ed36bceb7b867722b3..f71c674e92fe5ae42a930fbbf536193761b0e333 100644 --- a/transcoder_all/layer_41_width_16k_l0_big/config.json +++ b/transcoder_all/layer_41_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.41.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_41_width_16k_l0_big_affine/config.json b/transcoder_all/layer_41_width_16k_l0_big_affine/config.json index d376582bb98236a6fd7cb9fac1e0623186111988..f058f860e3ed4f532341e5cc9ae3109340a27415 100644 --- a/transcoder_all/layer_41_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_41_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.41.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_41_width_16k_l0_small/config.json b/transcoder_all/layer_41_width_16k_l0_small/config.json index 371ab83ad3c7431618c046942649736b3fbe332b..b4a9da495c770d39c3539465afb1c068048907d2 100644 --- a/transcoder_all/layer_41_width_16k_l0_small/config.json +++ b/transcoder_all/layer_41_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.41.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_41_width_262k_l0_big_affine/config.json b/transcoder_all/layer_41_width_262k_l0_big_affine/config.json index e922760ea730896c91b8c32d6b45707ec9a26d71..93c0bb4c693fc2802f8e57abdcbde930505398ab 100644 --- a/transcoder_all/layer_41_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_41_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.41.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_43_width_262k_l0_small_affine/config.json b/transcoder_all/layer_43_width_262k_l0_small_affine/config.json index db0b75701ac56d85b8086bad88ab945e56bc7603..51cc6a8959309207d3bed4e90b9cda94ef109719 100644 --- a/transcoder_all/layer_43_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_43_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.43.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_44_width_16k_l0_small_affine/config.json b/transcoder_all/layer_44_width_16k_l0_small_affine/config.json index 737cb7d021f250e954a242ef238505d30d9885e1..92299584960144a86e25fc2c37b299f2e34bba45 100644 --- a/transcoder_all/layer_44_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_44_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.44.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_47_width_262k_l0_small_affine/config.json b/transcoder_all/layer_47_width_262k_l0_small_affine/config.json index 17b8d379fe10c2cdc3a6352bbb1221203b0135db..8190f7dd1d84b4157f29543faddbbe565e4ea8f6 100644 --- a/transcoder_all/layer_47_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_47_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.47.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_49_width_16k_l0_big_affine/config.json b/transcoder_all/layer_49_width_16k_l0_big_affine/config.json index 687a5da441ab5d7236f4e489ffab46119ca2a1c8..657404c6858ca3ca8a65f34d1cac799d68df4f3f 100644 --- a/transcoder_all/layer_49_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_49_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.49.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_small_affine/config.json b/transcoder_all/layer_4_width_16k_l0_small_affine/config.json index e680fa0686895bc9e652eb2ad30fb29ff3510b23..8d944b2b52638d0a81e9c4df942d5dad6764c69c 100644 --- a/transcoder_all/layer_4_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_4_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_16k_l0_small_affine/config.json b/transcoder_all/layer_50_width_16k_l0_small_affine/config.json index 41b9a41a7681ffcc3f8f9d1cf700f2e6fcef7564..ae3f615777af6840fb84b20fe394069dfa8dbe65 100644 --- a/transcoder_all/layer_50_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_50_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_50_width_262k_l0_small_affine/config.json b/transcoder_all/layer_50_width_262k_l0_small_affine/config.json index bbe7460260ae1b9f8134067706915fa6eda0496e..af5079334a0736ae4551efa99a3f30c6afc79fd6 100644 --- a/transcoder_all/layer_50_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_50_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.50.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_51_width_262k_l0_big/config.json b/transcoder_all/layer_51_width_262k_l0_big/config.json index b3de7c25c7177c9625c6e99bdcb808eb8b2cacf3..f7b3e253499db09ea2aa7b820045b9525a4900d7 100644 --- a/transcoder_all/layer_51_width_262k_l0_big/config.json +++ b/transcoder_all/layer_51_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.51.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.51.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_16k_l0_big_affine/config.json b/transcoder_all/layer_52_width_16k_l0_big_affine/config.json index fef8bd5ecf4c9a85c40303bdc2507b58faae1548..54123cd720cb0f5ae2a722e4b01ac30d85dcf931 100644 --- a/transcoder_all/layer_52_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_52_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_16k_l0_small/config.json b/transcoder_all/layer_52_width_16k_l0_small/config.json index cfb936f7594220081d828357f4eb8b3f3ce26b73..2b9626ed69ff01ed5a039e662b8777531264f5a0 100644 --- a/transcoder_all/layer_52_width_16k_l0_small/config.json +++ b/transcoder_all/layer_52_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_16k_l0_small_affine/config.json b/transcoder_all/layer_52_width_16k_l0_small_affine/config.json index 2eddb096105fc00c8b2fef3f7e73405dfffd412a..ca5f58ef201982a59ab2a12b9ffad04b712323e6 100644 --- a/transcoder_all/layer_52_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_52_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_52_width_262k_l0_small/config.json b/transcoder_all/layer_52_width_262k_l0_small/config.json index d910a9ac999b1662a112b88ec6d8b0c997c6e6ec..904f796a1842dcfb610fc2e68d648af0b5c3a35b 100644 --- a/transcoder_all/layer_52_width_262k_l0_small/config.json +++ b/transcoder_all/layer_52_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.52.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_54_width_262k_l0_big_affine/config.json b/transcoder_all/layer_54_width_262k_l0_big_affine/config.json index 945c4bfb012445d1e53e8a52026146383ed8e45b..76a9a316bdf7d903e7ebc43b889c050696918939 100644 --- a/transcoder_all/layer_54_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_54_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.54.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_54_width_262k_l0_small_affine/config.json b/transcoder_all/layer_54_width_262k_l0_small_affine/config.json index 6058b7ad253a97b49a032ae1bfef520be541258d..66676e944d49e44dc4095538ee77d9eec89bdffb 100644 --- a/transcoder_all/layer_54_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_54_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.54.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_55_width_16k_l0_big_affine/config.json b/transcoder_all/layer_55_width_16k_l0_big_affine/config.json index 7e50ef8a46f62278a651e460aa9ea2478518a9c5..6c2812143490b201ee5b19d741794e4247b3025d 100644 --- a/transcoder_all/layer_55_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_55_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.55.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_56_width_16k_l0_small_affine/config.json b/transcoder_all/layer_56_width_16k_l0_small_affine/config.json index 43bf3d32416b839e0ae6bcb904ca7b2576677f01..92ce56afb7e647fafb5ac6f2a456c4ef6692df7c 100644 --- a/transcoder_all/layer_56_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_56_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.56.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.56.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_16k_l0_big_affine/config.json b/transcoder_all/layer_57_width_16k_l0_big_affine/config.json index 80284511f23a1b279deed63eab1f46059458b3b5..dab9bac525285f8999b81df8194bd9b9ddac4318 100644 --- a/transcoder_all/layer_57_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_57_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_16k_l0_small_affine/config.json b/transcoder_all/layer_57_width_16k_l0_small_affine/config.json index 3c901788f5df1a85ee26d6122f62dce339da769b..8f4b39dfbace690719a4b704c71888aad7ece8bb 100644 --- a/transcoder_all/layer_57_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_57_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_262k_l0_big/config.json b/transcoder_all/layer_57_width_262k_l0_big/config.json index c5318bf5bcffd239be175390c26a6e7f8e011f95..3d80ffca8011278145acf3d39bc51ed55b1cd7ee 100644 --- a/transcoder_all/layer_57_width_262k_l0_big/config.json +++ b/transcoder_all/layer_57_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_57_width_262k_l0_big_affine/config.json b/transcoder_all/layer_57_width_262k_l0_big_affine/config.json index 347384184aa55f52509618113d873a901e6b6f33..1e60c1872e74c5342b059c44c98f8b82cc949a54 100644 --- a/transcoder_all/layer_57_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_57_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.57.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_58_width_16k_l0_big/config.json b/transcoder_all/layer_58_width_16k_l0_big/config.json index 91266833ed42b39665723ae51e321e393bf1c8bf..08d881732c12ca0e0c4f768e1db24cc4fbbfc0fe 100644 --- a/transcoder_all/layer_58_width_16k_l0_big/config.json +++ b/transcoder_all/layer_58_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.58.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_58_width_262k_l0_small_affine/config.json b/transcoder_all/layer_58_width_262k_l0_small_affine/config.json index 9e8f05bc71c5ff18861000ac0264663e8c26c3f1..b566c6746a6fa00c51a96e22cf0a57093e242ab5 100644 --- a/transcoder_all/layer_58_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_58_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.58.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_60_width_16k_l0_small/config.json b/transcoder_all/layer_60_width_16k_l0_small/config.json index 53e965753b5bdc4ec29cbca237ddc2fc2eeeea66..72a2cd0ddfbb93dd3834617d0522a1eb04f49779 100644 --- a/transcoder_all/layer_60_width_16k_l0_small/config.json +++ b/transcoder_all/layer_60_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.60.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_big/config.json b/transcoder_all/layer_6_width_16k_l0_big/config.json index a1e6a6e4738c45adfbfd501f220e9e8b9acfb19d..b13331b25ae4441bd4257c4f70690caa952fd185 100644 --- a/transcoder_all/layer_6_width_16k_l0_big/config.json +++ b/transcoder_all/layer_6_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 77, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_16k_l0_small_affine/config.json b/transcoder_all/layer_6_width_16k_l0_small_affine/config.json index cdc9503c33fd1a221b0842fe25d2b586985b6843..06096e9cb190840825bb17629a220348c6042452 100644 --- a/transcoder_all/layer_6_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_6_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 12, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_small/config.json b/transcoder_all/layer_7_width_16k_l0_small/config.json index 542ed41f9e7afeb28f091debd4e2384aec3e9a7f..325e936c9a567268c27baed58a429e305ab816a0 100644 --- a/transcoder_all/layer_7_width_16k_l0_small/config.json +++ b/transcoder_all/layer_7_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_big_affine/config.json b/transcoder_all/layer_7_width_262k_l0_big_affine/config.json index 4ebb7eff3b32f413020ccb6782536bc2d5feceb8..2d816b437850dbca52349ffd6000951fdcd646ea 100644 --- a/transcoder_all/layer_7_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_7_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 80, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_small/config.json b/transcoder_all/layer_7_width_262k_l0_small/config.json index 69b1a99ad77802d5fc81fe9bcada1d2f893811c1..55ce2553616d2fcb50ff6176d51cda11cd3f1305 100644 --- a/transcoder_all/layer_7_width_262k_l0_small/config.json +++ b/transcoder_all/layer_7_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_16k_l0_big/config.json b/transcoder_all/layer_8_width_16k_l0_big/config.json index 1c16d951b93584b757cc9efdfbc3b65e097055c0..9528ba716e07bf1dc7cd8679eedf1a255a9876d3 100644 --- a/transcoder_all/layer_8_width_16k_l0_big/config.json +++ b/transcoder_all/layer_8_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 83, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_big/config.json b/transcoder_all/layer_8_width_262k_l0_big/config.json index 02bc8edd7735b9e5ec2e943dc8ef6d03576939fa..b8048acff0a3c9864c89aae64f10f0738f9e6180 100644 --- a/transcoder_all/layer_8_width_262k_l0_big/config.json +++ b/transcoder_all/layer_8_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 83, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_small_affine/config.json b/transcoder_all/layer_8_width_262k_l0_small_affine/config.json index d4403a48bd1a2950f191f3501353a511d18d8125..b7d80ae11a7d0b1833cb41ca149bf60b5360387d 100644 --- a/transcoder_all/layer_8_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_8_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_big_affine/config.json b/transcoder_all/layer_9_width_262k_l0_big_affine/config.json index 6aa34bf3f85bcf0a5ddde663ce1059bb786351d3..a5597f81132b366acc048fb43c65d797ac390922 100644 --- a/transcoder_all/layer_9_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_9_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-27b-it", + "model_name": "google/gemma-3-27b-it", "architecture": "jump_relu", "l0": 86, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file