diff --git a/clt/width_262k_l0_big/config.json b/clt/width_262k_l0_big/config.json index e862c095410cefc1790f28b33c4e9d96ca9c92af..e7467634935e5c0743af638a46138f2683f60522 100644 --- a/clt/width_262k_l0_big/config.json +++ b/clt/width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", "width": 262080, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "clt" } \ No newline at end of file diff --git a/clt/width_262k_l0_big_affine/config.json b/clt/width_262k_l0_big_affine/config.json index 245d8bccd2d7f458e4b9de967574f479e8c79bdf..30d0f0f8ace0526b657eb10b9438d9fd4a96b190 100644 --- a/clt/width_262k_l0_big_affine/config.json +++ b/clt/width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", "width": 262080, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": true + "affine_connection": true, + "type": "clt" } \ No newline at end of file diff --git a/clt/width_262k_l0_medium/config.json b/clt/width_262k_l0_medium/config.json index a505d728e791c07a7398d9069f198c1e5a321c6d..de0a162543ffae52b2f12664c43306b7f48f8d51 100644 --- a/clt/width_262k_l0_medium/config.json +++ b/clt/width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", "width": 262080, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 50, - "affine_connection": false + "affine_connection": false, + "type": "clt" } \ No newline at end of file diff --git a/clt/width_262k_l0_medium_affine/config.json b/clt/width_262k_l0_medium_affine/config.json index ebef3c7344b3c85e6fc4d866591b5f01f8e9ab0d..514df5870912886d228ed493cbf4884af541e8a5 100644 --- a/clt/width_262k_l0_medium_affine/config.json +++ b/clt/width_262k_l0_medium_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", "width": 262080, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 50, - "affine_connection": true + "affine_connection": true, + "type": "clt" } \ No newline at end of file diff --git a/clt/width_524k_l0_big/config.json b/clt/width_524k_l0_big/config.json index 0f70342a47863834ff0a300ec55a5b1442b33c3e..2bccbbf8d1995d72b6c24f9b068b3eb179740073 100644 --- a/clt/width_524k_l0_big/config.json +++ b/clt/width_524k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", "width": 524160, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "clt" } \ No newline at end of file diff --git a/clt/width_524k_l0_medium/config.json b/clt/width_524k_l0_medium/config.json index 1e61cf4a1ef24ec1138f25f60ac9d7568bdfc0ca..5a34efcdf4e4e77e5953a386cfff79511a7ab7b5 100644 --- a/clt/width_524k_l0_medium/config.json +++ b/clt/width_524k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", "width": 524160, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 50, - "affine_connection": false + "affine_connection": false, + "type": "clt" } \ No newline at end of file diff --git a/clt/width_524k_l0_medium_affine/config.json b/clt/width_524k_l0_medium_affine/config.json index e3f4e3a7b7697f90ab765d3e6c8fae418551f89c..cab462607660056238fe04828141c548733decc7 100644 --- a/clt/width_524k_l0_medium_affine/config.json +++ b/clt/width_524k_l0_medium_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", "width": 524160, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 50, - "affine_connection": true + "affine_connection": true, + "type": "clt" } \ No newline at end of file diff --git a/crosscoder/layer_5_9_12_15_width_262k_l0_big/config.json b/crosscoder/layer_5_9_12_15_width_262k_l0_big/config.json index 2990ced83e5aff935d511a4d00b0b8ce3497ba2a..ea13527029a94026237b8e84a502da4e9522b89f 100644 --- a/crosscoder/layer_5_9_12_15_width_262k_l0_big/config.json +++ b/crosscoder/layer_5_9_12_15_width_262k_l0_big/config.json @@ -1,9 +1,10 @@ { - "hf_hook_point_in": "model.layers.{5.0,9.5,12.200000000000001,15.799999999999999}.output", - "hf_hook_point_out": "model.layers.{5.0,9.5,12.200000000000001,15.799999999999999}.output", + "hf_hook_point_in": "model.layers.{5,9,12,15}.output", + "hf_hook_point_out": "model.layers.{5,9,12,15}.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "crosscoder" } \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_16k_l0_big/config.json b/mlp_out_all/layer_0_width_16k_l0_big/config.json index 38e85c69e044739a540f935d9e5d6abaf9aed390..f516216d300f047b4096b7a311029180bdb9ae8b 100644 --- a/mlp_out_all/layer_0_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_0_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_16k_l0_small/config.json b/mlp_out_all/layer_0_width_16k_l0_small/config.json index 925d4cb258fd9e731115f7eb806f5a9dc78593bc..ef27d95436d2179c1847a2241a49a97bf658351a 100644 --- a/mlp_out_all/layer_0_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_0_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_262k_l0_big/config.json b/mlp_out_all/layer_0_width_262k_l0_big/config.json index db4ea14c707ba6deccae807a994e772e9e5100a2..20877ac94f5aa6c3b45f3943c72a0e40cc7ee245 100644 --- a/mlp_out_all/layer_0_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_0_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_262k_l0_small/config.json b/mlp_out_all/layer_0_width_262k_l0_small/config.json index 21124c6f8b1c93fe71bb5d0d9a0be630fba80455..fa02702ea874cf6fecf52f241920a0762ee56fff 100644 --- a/mlp_out_all/layer_0_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_0_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_16k_l0_big/config.json b/mlp_out_all/layer_10_width_16k_l0_big/config.json index 01d79dcb232b4d79bd06e03e7bdeeab9ad30f16f..f296d289841bd27ece2a41e79cd0cdae7e9e3281 100644 --- a/mlp_out_all/layer_10_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_10_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_16k_l0_small/config.json b/mlp_out_all/layer_10_width_16k_l0_small/config.json index c43064b216320b98f51346c6e95377e3dc493195..0df6937e11098648dc4ea904f9b92a6f41277652 100644 --- a/mlp_out_all/layer_10_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_10_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_262k_l0_big/config.json b/mlp_out_all/layer_10_width_262k_l0_big/config.json index 0391add096a70e40c0f99db6d85bdc6969037b36..c149e86b2ba295e31b61bcf072152cc682f0d64d 100644 --- a/mlp_out_all/layer_10_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_10_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_262k_l0_small/config.json b/mlp_out_all/layer_10_width_262k_l0_small/config.json index 7b1164b99437bd8140ca4bc23651a621030dfe14..cff0b0aac1409451921ac3758328a9aee42de2c6 100644 --- a/mlp_out_all/layer_10_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_10_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_16k_l0_big/config.json b/mlp_out_all/layer_11_width_16k_l0_big/config.json index 1a13bea3581ca9ed8c09284ee6b7ecf7ffe30edf..ded8279dfd26643b3be94e59371b95cf55d31e16 100644 --- a/mlp_out_all/layer_11_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_11_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_16k_l0_small/config.json b/mlp_out_all/layer_11_width_16k_l0_small/config.json index aae78685d9e0213b21ac8b35955bec2da87f8d02..eb9876fbe3db7d24e9c2852699f3ae91fd8572f0 100644 --- a/mlp_out_all/layer_11_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_11_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_262k_l0_big/config.json b/mlp_out_all/layer_11_width_262k_l0_big/config.json index 2705921fff3ddbb7bdd46dfdb0e48e9729372d0b..12513953e2493d1bb873f32d8d595cb34b756765 100644 --- a/mlp_out_all/layer_11_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_11_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_262k_l0_small/config.json b/mlp_out_all/layer_11_width_262k_l0_small/config.json index a701864c3b821a4ea4f2e5e4e1667c071f5f2826..14057ed182b69355ccaa604e761ec1ff1ca44ed5 100644 --- a/mlp_out_all/layer_11_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_11_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_16k_l0_big/config.json b/mlp_out_all/layer_12_width_16k_l0_big/config.json index bbd6aec50dda2a398d523494cfff76ae8c3b9edf..060eeded90cc481835dbb5464d0eeb156fe39cfe 100644 --- a/mlp_out_all/layer_12_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_12_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_16k_l0_small/config.json b/mlp_out_all/layer_12_width_16k_l0_small/config.json index 4699a11ca5ed92998469629a6bdb69f91f215bf1..cbbefd283fcaae255d243fcc322c89ca7cbae646 100644 --- a/mlp_out_all/layer_12_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_12_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_262k_l0_big/config.json b/mlp_out_all/layer_12_width_262k_l0_big/config.json index bec572c190f3a1ce1293a2f2173585a811c478d5..51a5f84c1fd0d8df95c6b76ae3752cdab0d31c73 100644 --- a/mlp_out_all/layer_12_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_12_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_262k_l0_small/config.json b/mlp_out_all/layer_12_width_262k_l0_small/config.json index 84f463d615920c1161012b4f8ec0ab75e19fc4ae..38d6655d03d1d102354424a1a848a1b0b2f7eb66 100644 --- a/mlp_out_all/layer_12_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_12_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_16k_l0_big/config.json b/mlp_out_all/layer_13_width_16k_l0_big/config.json index ac80cc0961fa3072fc05ae5eb5bbb958e1010dd0..f7ccbf01e7c9589fbf9808c791c65d36db875f50 100644 --- a/mlp_out_all/layer_13_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_13_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_16k_l0_small/config.json b/mlp_out_all/layer_13_width_16k_l0_small/config.json index 09e80732b55b03f0695f3a778951bf967cd98a3e..bf57ebd80ad887d4bc6d51d028f919f7998a5285 100644 --- a/mlp_out_all/layer_13_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_13_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_262k_l0_big/config.json b/mlp_out_all/layer_13_width_262k_l0_big/config.json index 96b2cb3a4645534767aeea69134315eb9fe2b043..e90b2636442461d7dec59cdc4c705f36ccb457e7 100644 --- a/mlp_out_all/layer_13_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_13_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_16k_l0_big/config.json b/mlp_out_all/layer_14_width_16k_l0_big/config.json index a227d4d71878e175f38ac3d85343b0e5954c8cb7..05ddb1ee06799b888eecef811175cf659cd0fc16 100644 --- a/mlp_out_all/layer_14_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_14_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_16k_l0_small/config.json b/mlp_out_all/layer_14_width_16k_l0_small/config.json index 456ef83f857ad98c39d6184c264b86b25d9d95a9..849ab81ec14966ee7abfa8ce56d0d99a367da097 100644 --- a/mlp_out_all/layer_14_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_14_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_262k_l0_big/config.json b/mlp_out_all/layer_14_width_262k_l0_big/config.json index 1bf269ef33c5a72356613bcc26ee6fd226415af2..01b49def89caf8b0980a5ff683e5392e7964c612 100644 --- a/mlp_out_all/layer_14_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_14_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_262k_l0_small/config.json b/mlp_out_all/layer_14_width_262k_l0_small/config.json index 7a96c0cd949fd3a354329bee9b988117c03b268e..1497053ca664f8376003d8f283bb612686e67e78 100644 --- a/mlp_out_all/layer_14_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_14_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_16k_l0_big/config.json b/mlp_out_all/layer_15_width_16k_l0_big/config.json index 2f22b4348c12c8a76557b6cde93fc3ff6a1de2e5..ae249fce540b3180042356cb5a8aa295c806f561 100644 --- a/mlp_out_all/layer_15_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_15_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_16k_l0_small/config.json b/mlp_out_all/layer_15_width_16k_l0_small/config.json index b31fdcd386bfeec459039b7ee038cb9613c133ff..31d2ddd022cbf94a09ccd07ffd5ba03d9ca59dd6 100644 --- a/mlp_out_all/layer_15_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_15_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_262k_l0_big/config.json b/mlp_out_all/layer_15_width_262k_l0_big/config.json index 9b936ebc8ca3b3b2697c0bb7d232988aaaf75372..641b147a14711ba747729b616ebca40d08313220 100644 --- a/mlp_out_all/layer_15_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_15_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_262k_l0_small/config.json b/mlp_out_all/layer_15_width_262k_l0_small/config.json index bdf4cb59b767b38f2e8f218c09a409e7919975c5..4ba48ad2cdd67d439f6922119ca09eab3ae57915 100644 --- a/mlp_out_all/layer_15_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_15_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_16k_l0_big/config.json b/mlp_out_all/layer_16_width_16k_l0_big/config.json index 6c301b1c9f55208e7f1c19eb98c0dc5c59ce9611..20953d7ca9bace6958d6e260633c6ae4f96986a3 100644 --- a/mlp_out_all/layer_16_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_16_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_262k_l0_small/config.json b/mlp_out_all/layer_16_width_262k_l0_small/config.json index 5bda8d034bbd55cbbeb9a80677b0598844108d66..937fe033043123656c06d9e00ff06457c965421e 100644 --- a/mlp_out_all/layer_16_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_16_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_16k_l0_big/config.json b/mlp_out_all/layer_17_width_16k_l0_big/config.json index 6cfe1f984da35e3f5fcebc2d4657c5a3ca02115b..8be7637fc7f5e870b8983aba0518cb55889b9f8c 100644 --- a/mlp_out_all/layer_17_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_17_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_16k_l0_small/config.json b/mlp_out_all/layer_17_width_16k_l0_small/config.json index 98976eabd2f05a598e6f4cea6495553df7971d77..a2d9b403938e190261e058436f444098352b59ef 100644 --- a/mlp_out_all/layer_17_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_17_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_big/config.json b/mlp_out_all/layer_17_width_262k_l0_big/config.json index 6a25cdbd3ffdc89b9d37f77ab56cfcdd3f966471..fe2c5b370a4626472e08b3310456e4cd64081d59 100644 --- a/mlp_out_all/layer_17_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_17_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_small/config.json b/mlp_out_all/layer_17_width_262k_l0_small/config.json index 5302c447211a49d3bdb9658c142ddcac3f2daa90..22a3c0eae126e90641fdf53c4b7e60e525ac31d0 100644 --- a/mlp_out_all/layer_17_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_17_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_1_width_16k_l0_big/config.json b/mlp_out_all/layer_1_width_16k_l0_big/config.json index a45d561d5cbb75b918a3d9daaf019cf2a79692ab..815db063c93454c5cdbaeebd7d0930f3f9a2daca 100644 --- a/mlp_out_all/layer_1_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_1_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 70, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_1_width_262k_l0_small/config.json b/mlp_out_all/layer_1_width_262k_l0_small/config.json index 55c839e55fc92b092c0fc1e2c69e5993f238ebad..789806372398be401a62753d21f8b4f1570640f9 100644 --- a/mlp_out_all/layer_1_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_1_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_16k_l0_big/config.json b/mlp_out_all/layer_2_width_16k_l0_big/config.json index 354afe925f7315e4c66620cd2a724329da0e3388..4ac27e6488b61b71c05026385855c7fd65d04b06 100644 --- a/mlp_out_all/layer_2_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_2_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 80, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_16k_l0_small/config.json b/mlp_out_all/layer_2_width_16k_l0_small/config.json index a1eadabf1fd49ad8a4c7eb63785bdd270010dd13..a239395deaa4317351a191615a69dab467bc7ef6 100644 --- a/mlp_out_all/layer_2_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_2_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_262k_l0_big/config.json b/mlp_out_all/layer_2_width_262k_l0_big/config.json index 5c6215800b3e60b93bda9f194b9ebafc3831193b..d1bc735b04f073cb8386275c623d7c02e9c9a716 100644 --- a/mlp_out_all/layer_2_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_2_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 80, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_16k_l0_big/config.json b/mlp_out_all/layer_3_width_16k_l0_big/config.json index b12ae3343df7d3af7486ea346a7fc327a83d8cf2..d46c3620d7f4814042e89e59318d9d634d028e64 100644 --- a/mlp_out_all/layer_3_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_3_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 90, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_16k_l0_small/config.json b/mlp_out_all/layer_3_width_16k_l0_small/config.json index 6309099498903c46ff7b6c3b14baa61b8b77c6bf..077123734696bd0eb7a64235046a024083f98236 100644 --- a/mlp_out_all/layer_3_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_3_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_262k_l0_big/config.json b/mlp_out_all/layer_3_width_262k_l0_big/config.json index a3a14408f3115c20007e6d300320c051058c39cd..8cd76d99edc88e8519133e60dd516a55db29f96f 100644 --- a/mlp_out_all/layer_3_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_3_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 90, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_262k_l0_small/config.json b/mlp_out_all/layer_3_width_262k_l0_small/config.json index d4e4a6b65907ac9f7055ac24a5c9b6e53d2510c9..ecea7276ddb8dfbd5b9f14015bbe9b74009637b4 100644 --- a/mlp_out_all/layer_3_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_3_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_16k_l0_big/config.json b/mlp_out_all/layer_4_width_16k_l0_big/config.json index 8858f5cd765df1b843dfbeac2ecc6f7aea3913d5..e5947f9133b738c2310429957a2706ba0bf06bd8 100644 --- a/mlp_out_all/layer_4_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_4_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 100, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_16k_l0_small/config.json b/mlp_out_all/layer_4_width_16k_l0_small/config.json index b6cf3a705271000d4237d32223bb9547cf1945d0..0535fdee2f4aa7a2e8cacb45fc84b859c5ea6b29 100644 --- a/mlp_out_all/layer_4_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_4_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_262k_l0_big/config.json b/mlp_out_all/layer_4_width_262k_l0_big/config.json index 3c837e095af0617ea03b8ea3e962c8000b7a4478..a42de6de733591bb2adbe7e25a69f81e31a0ab06 100644 --- a/mlp_out_all/layer_4_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_4_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 100, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_262k_l0_small/config.json b/mlp_out_all/layer_4_width_262k_l0_small/config.json index 4db1a192352450ff43e486221a6d17d754273851..7a5d92c4101dcff7f59ed13813c504e6f98d4a9a 100644 --- a/mlp_out_all/layer_4_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_4_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_16k_l0_big/config.json b/mlp_out_all/layer_5_width_16k_l0_big/config.json index 657ab9702d8a6efab69c62b341f1c6af6c8a35d5..7875281cefe32f8b4947336f32829ffae40719d7 100644 --- a/mlp_out_all/layer_5_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_5_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 110, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_16k_l0_small/config.json b/mlp_out_all/layer_5_width_16k_l0_small/config.json index 30b468474c5f93e9ba772fa4fbf3dab139ef0e28..102dc6957b53fa15275510abcf30a93642603f4a 100644 --- a/mlp_out_all/layer_5_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_5_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_262k_l0_big/config.json b/mlp_out_all/layer_5_width_262k_l0_big/config.json index a5db984e287954684b0cf38a6add2b6a8e61c21b..6d953645664fd1f168a6d45783912ecdb56625a4 100644 --- a/mlp_out_all/layer_5_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_5_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 110, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_262k_l0_small/config.json b/mlp_out_all/layer_5_width_262k_l0_small/config.json index c6d871f7619bcb665c395af556cc19c756025dfa..d71195302db44087c2bd53fc0cb1a01828040ef5 100644 --- a/mlp_out_all/layer_5_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_5_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_16k_l0_big/config.json b/mlp_out_all/layer_6_width_16k_l0_big/config.json index 6628380943582cdfafb237ede58aca81a528e4b3..3b5e37592c95db7121794341a2165c93d821ea7e 100644 --- a/mlp_out_all/layer_6_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_6_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_16k_l0_small/config.json b/mlp_out_all/layer_6_width_16k_l0_small/config.json index 4e617eadfa7562d031aa6f742c058ce38defe4f7..308bd4e674c270fcea44a244f0dba77d4f88e4da 100644 --- a/mlp_out_all/layer_6_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_6_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_262k_l0_big/config.json b/mlp_out_all/layer_6_width_262k_l0_big/config.json index 04472343bb8888d24899e85bcdb7d977d10305f5..4706cfc58033dfc4339d99919a45b1dfdebc1c7c 100644 --- a/mlp_out_all/layer_6_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_6_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_262k_l0_small/config.json b/mlp_out_all/layer_6_width_262k_l0_small/config.json index 69debce96460d3a7d556ef652fdade1505f0dd57..585ce1d88df494a7233d63b6f1e5faced4c277f7 100644 --- a/mlp_out_all/layer_6_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_6_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_big/config.json b/mlp_out_all/layer_7_width_16k_l0_big/config.json index de12228533662a6725fa285ab0e59ca4cceb5772..6d5e1c9753ff4631181416b56bddb83916963367 100644 --- a/mlp_out_all/layer_7_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_7_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_small/config.json b/mlp_out_all/layer_7_width_16k_l0_small/config.json index 07b0878977592a5642aa5eaf69f4a2a32c32d975..bfd1cab22942e9d4bd63543795612bbc60f882fd 100644 --- a/mlp_out_all/layer_7_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_7_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_262k_l0_big/config.json b/mlp_out_all/layer_7_width_262k_l0_big/config.json index 9c9fabcd6f2a9bd180c77bdfbedf635a78243f89..a9107440b63c99b0ac7ce19a7f15a387a727e2dc 100644 --- a/mlp_out_all/layer_7_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_7_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_262k_l0_small/config.json b/mlp_out_all/layer_7_width_262k_l0_small/config.json index f27b01aace758faec6a920f579917e79e3695aa0..72d3720fb0cd647d0baafd54f0fba29e218b5969 100644 --- a/mlp_out_all/layer_7_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_7_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_16k_l0_big/config.json b/mlp_out_all/layer_8_width_16k_l0_big/config.json index c8bb5846079450ad8b9f5716fa6478dd45ede8f5..3a6e9405ba15c6fe8af9062379583ce76e68c382 100644 --- a/mlp_out_all/layer_8_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_8_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_262k_l0_big/config.json b/mlp_out_all/layer_8_width_262k_l0_big/config.json index 82cf14d2a44f0bcf6e40f04908067d2eec89fa7b..df7b398668ce1958e9ae6ea3f09d7636d3390ad1 100644 --- a/mlp_out_all/layer_8_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_8_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_262k_l0_small/config.json b/mlp_out_all/layer_8_width_262k_l0_small/config.json index b79bee202e3b5510b6ed3b9f9a2ca2843e16c6ca..62a6d71943f12473fedeee0d0b885eb2535afd22 100644 --- a/mlp_out_all/layer_8_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_8_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_16k_l0_big/config.json b/mlp_out_all/layer_9_width_16k_l0_big/config.json index e620cbcd3a6e36760b4f8cf1eee7c7c8a0bba851..345051b17d43c9ba38ebc77adc36aa9cbcda0411 100644 --- a/mlp_out_all/layer_9_width_16k_l0_big/config.json +++ b/mlp_out_all/layer_9_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_16k_l0_small/config.json b/mlp_out_all/layer_9_width_16k_l0_small/config.json index 39288522b0ffab750eb98e79b80f57284e5c95a5..0732c8ffa3b4d700d9e910196d95f83b365e7573 100644 --- a/mlp_out_all/layer_9_width_16k_l0_small/config.json +++ b/mlp_out_all/layer_9_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_262k_l0_big/config.json b/mlp_out_all/layer_9_width_262k_l0_big/config.json index 1ac7c41c4a5adcd9d64d929464ed0d67468dd9e8..bc50696e04653bd4a3ca14ca1b849149834900c5 100644 --- a/mlp_out_all/layer_9_width_262k_l0_big/config.json +++ b/mlp_out_all/layer_9_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_262k_l0_small/config.json b/mlp_out_all/layer_9_width_262k_l0_small/config.json index 7fce4e84f82961fd495e31fdaf1f75f8c2541383..7f50a135da51072c093961bca92eecfb2f552d34 100644 --- a/mlp_out_all/layer_9_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_9_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_big/config.json b/resid_post/layer_12_width_262k_l0_big/config.json index 402067bda5e5bb88750932894d540dbd1bc4e9cb..9a4ee3f1775651ec0cc0d41e2327436b193d8fa2 100644 --- a/resid_post/layer_12_width_262k_l0_big/config.json +++ b/resid_post/layer_12_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_65k_l0_big/config.json b/resid_post/layer_12_width_65k_l0_big/config.json index 785c3fbce60424bcb8db286d556ae27263c76ce5..99407ecd7b4800b8f4aa7db00d64cbc45f67ae83 100644 --- a/resid_post/layer_12_width_65k_l0_big/config.json +++ b/resid_post/layer_12_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_16k_l0_small/config.json b/resid_post/layer_15_width_16k_l0_small/config.json index a7afb89694c0ad4408513d4c47a0219f36a288c8..5b8bd009005a541d2d053517dd9fd7cbeb54a1a7 100644 --- a/resid_post/layer_15_width_16k_l0_small/config.json +++ b/resid_post/layer_15_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_5_width_262k_l0_medium_seed_1/config.json index 915eb4d97029b71cb8595f94ef3d077f1aa934a4..115115126f63cb8acd296e8ab332de6ed98d8523 100644 --- a/resid_post/layer_5_width_262k_l0_medium_seed_1/config.json +++ b/resid_post/layer_5_width_262k_l0_medium_seed_1/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_small/config.json b/resid_post/layer_9_width_262k_l0_small/config.json index 0239d135f60a1a6e63e30fcd683224a7378c67a3..104aa10787f197a935be5886398a89b3618f2b80 100644 --- a/resid_post/layer_9_width_262k_l0_small/config.json +++ b/resid_post/layer_9_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/transcoder/layer_15_width_262k_l0_small/config.json b/transcoder/layer_15_width_262k_l0_small/config.json index 460a1dd6fa92d6430e40f1502d8f607a1e7b6538..42e4b8fe0b8b9a719811411b07455cc0bad02498 100644 --- a/transcoder/layer_15_width_262k_l0_small/config.json +++ b/transcoder/layer_15_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_16k_l0_big/config.json b/transcoder_all/layer_0_width_16k_l0_big/config.json index bfb5494200b715f6b5485eb82b9c57d01adf4cf8..f8c303569f3f110e1a2d033482e4f63125221287 100644 --- a/transcoder_all/layer_0_width_16k_l0_big/config.json +++ b/transcoder_all/layer_0_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_big/config.json b/transcoder_all/layer_0_width_262k_l0_big/config.json index 3f19b379b61ecbef563f5f60de97b6b96b09db57..0daff67a7db87f607fb045f874dbb63e2e187238 100644 --- a/transcoder_all/layer_0_width_262k_l0_big/config.json +++ b/transcoder_all/layer_0_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_small/config.json b/transcoder_all/layer_0_width_262k_l0_small/config.json index 95cbb2c3ace8947e3c232ccb64b9f68e87e492f2..a0a6d5538f49c1be6755465fac83635cd705c871 100644 --- a/transcoder_all/layer_0_width_262k_l0_small/config.json +++ b/transcoder_all/layer_0_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_small_affine/config.json b/transcoder_all/layer_0_width_262k_l0_small_affine/config.json index 6fa9a691ba5d95fd6bbef29ff05f6e4642c8b2cb..9e2e23a682317c4171ba949a79d5ab38575cf1a5 100644 --- a/transcoder_all/layer_0_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_0_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_small/config.json b/transcoder_all/layer_10_width_16k_l0_small/config.json index ed003058b8ba6c078df31b4be4059e4ab6cf9b59..55d3f9de5dcb8e354fa23a42b1e3440e3db5df67 100644 --- a/transcoder_all/layer_10_width_16k_l0_small/config.json +++ b/transcoder_all/layer_10_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_small_affine/config.json b/transcoder_all/layer_10_width_16k_l0_small_affine/config.json index d8b75cc37a65ba851bf0d4466fbd369b6943ad9e..f2d85925f9a80d0c896dfd20566ff1a11c48af84 100644 --- a/transcoder_all/layer_10_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_10_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_big/config.json b/transcoder_all/layer_10_width_262k_l0_big/config.json index 5abe0c8ddb390e3eeef5e24c75db7c4a60c9c3b2..9419a54735ce062f2ce5fab17da81c3b3c2ed155 100644 --- a/transcoder_all/layer_10_width_262k_l0_big/config.json +++ b/transcoder_all/layer_10_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_262k_l0_big_affine/config.json b/transcoder_all/layer_10_width_262k_l0_big_affine/config.json index d06210222132d43cc76b782810350f1494063064..5e80e9bb88ff928865935dfe180babe2bc1a7c94 100644 --- a/transcoder_all/layer_10_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_10_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_16k_l0_small/config.json b/transcoder_all/layer_11_width_16k_l0_small/config.json index cd4c70ade12c57ff138ea11c98da45dcef6f39c2..59d8a40ca2732486cbf75c2fc28d493319d160c9 100644 --- a/transcoder_all/layer_11_width_16k_l0_small/config.json +++ b/transcoder_all/layer_11_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_big_affine/config.json b/transcoder_all/layer_12_width_16k_l0_big_affine/config.json index e0db464fa728930a074a163276cb2df6e8c532a8..ec01cf2337097d3bfd268c2cf99297ecce0e31bf 100644 --- a/transcoder_all/layer_12_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_12_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_12_width_16k_l0_small_affine/config.json b/transcoder_all/layer_12_width_16k_l0_small_affine/config.json index c2cfe43632fc0bfe3e8472f261911cc961bf71bc..c90439a6f509e88f53818dfbf0cfb30b2e9c63aa 100644 --- a/transcoder_all/layer_12_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_12_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_big_affine/config.json b/transcoder_all/layer_13_width_16k_l0_big_affine/config.json index 3256f801a534297b85dd6aa7c390fd6d520f718a..2866052b1df3e32759ab75bd8bcdc87017a70434 100644 --- a/transcoder_all/layer_13_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_13_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_small/config.json b/transcoder_all/layer_13_width_16k_l0_small/config.json index 6d62704977a5db083990bdc51198ba8396e58f27..5bd0da1a3a8271c34a50f70302770264e9d3d777 100644 --- a/transcoder_all/layer_13_width_16k_l0_small/config.json +++ b/transcoder_all/layer_13_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_small_affine/config.json b/transcoder_all/layer_13_width_16k_l0_small_affine/config.json index 7ca4249a3fbec246a4afa8a7214bde9831d5cc42..491838df19529cb9ad681d7098b6666bc51b6c02 100644 --- a/transcoder_all/layer_13_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_13_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_big_affine/config.json b/transcoder_all/layer_13_width_262k_l0_big_affine/config.json index d580a6473e80df7b8b5b621b9373e02bb63ede00..97295d6e6e39cd1b3fb72b9ed689f88ff9121c33 100644 --- a/transcoder_all/layer_13_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_13_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_262k_l0_small_affine/config.json b/transcoder_all/layer_13_width_262k_l0_small_affine/config.json index c888789ece6b992b7aa396a1d1ef5dee7ea3679c..85bbd940de00e82b1f7c6a7beeda9bdc4faa97fa 100644 --- a/transcoder_all/layer_13_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_13_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_14_width_16k_l0_big/config.json b/transcoder_all/layer_14_width_16k_l0_big/config.json index c0cab431f0881f87e0aaf42717d52ca9bf78b077..bf31808eb054b8c9b0a5b048a1d3d5ca70371085 100644 --- a/transcoder_all/layer_14_width_16k_l0_big/config.json +++ b/transcoder_all/layer_14_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_14_width_262k_l0_small/config.json b/transcoder_all/layer_14_width_262k_l0_small/config.json index fb62e4ff99105aa893a2699d13fdaa02356199b6..cd4df62d9603df8985bef5a64dddc466e3e7b014 100644 --- a/transcoder_all/layer_14_width_262k_l0_small/config.json +++ b/transcoder_all/layer_14_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.14.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_16k_l0_big/config.json b/transcoder_all/layer_15_width_16k_l0_big/config.json index c0c06519438d09a80ed9aab0d88b8890a54e2cb2..3a9008a7f0d6e7c311869e6335f6c0ab4b72d453 100644 --- a/transcoder_all/layer_15_width_16k_l0_big/config.json +++ b/transcoder_all/layer_15_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_big/config.json b/transcoder_all/layer_15_width_262k_l0_big/config.json index 121d8791c2ee27ed3a4016a43fbc07cad0685263..3ec37680733ef99da31e6e2980d96f4c734c1da3 100644 --- a/transcoder_all/layer_15_width_262k_l0_big/config.json +++ b/transcoder_all/layer_15_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_16_width_262k_l0_small_affine/config.json b/transcoder_all/layer_16_width_262k_l0_small_affine/config.json index d92c14ed876f570b8cfe9bdc2041bc4066ccca2c..f37d31a99403c93cb6ab21eef0920da3143d6dbf 100644 --- a/transcoder_all/layer_16_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_16_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.16.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_big_affine/config.json b/transcoder_all/layer_17_width_16k_l0_big_affine/config.json index a1575be27b9aab34726d3ff437c175d583b3b1a9..81db3e02fd3c4111dcd117e2a6ae259746bbf341 100644 --- a/transcoder_all/layer_17_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_17_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_big/config.json b/transcoder_all/layer_17_width_262k_l0_big/config.json index 941fcfc4f71b0c5e167d5616c9cc125ed41df97e..9bd415ea3917a75c4e150656fe81baa328e36fcc 100644 --- a/transcoder_all/layer_17_width_262k_l0_big/config.json +++ b/transcoder_all/layer_17_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_big_affine/config.json b/transcoder_all/layer_17_width_262k_l0_big_affine/config.json index 2a5b0cfa7d130bebd75ef04451af6dd21d2976be..c33b2804bba978ad5a95d83e905f33479ee9794f 100644 --- a/transcoder_all/layer_17_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_17_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small/config.json b/transcoder_all/layer_17_width_262k_l0_small/config.json index e8b8e9c4767ec151d0da8ffda060d90576b2c6fa..b94115fe29b5bb41d92e2e044827527870de3ef9 100644 --- a/transcoder_all/layer_17_width_262k_l0_small/config.json +++ b/transcoder_all/layer_17_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_16k_l0_big_affine/config.json b/transcoder_all/layer_1_width_16k_l0_big_affine/config.json index 6dfdecc2e38ea2854c4847c607cbbbe6638aa0bf..9df07870715c11b73df91e1c3cca625f1b427fe6 100644 --- a/transcoder_all/layer_1_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_1_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 70, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_16k_l0_small_affine/config.json b/transcoder_all/layer_2_width_16k_l0_small_affine/config.json index 3cc4af8c4408d2df86ebfa571243b4ee82f268a8..679d6c9f18ff8be168ae682caeaa755fb0248dae 100644 --- a/transcoder_all/layer_2_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_2_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_small_affine/config.json b/transcoder_all/layer_2_width_262k_l0_small_affine/config.json index 01120267e6e5cab244a329f49c04781322753643..245acb22b8d5346291ea02824a2df6cc46c451f2 100644 --- a/transcoder_all/layer_2_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_2_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_big/config.json b/transcoder_all/layer_3_width_16k_l0_big/config.json index 919c04048c090e3e14f91f76feff2b32dd65f6bf..3edd7e78b97f02b5b4db1c66f6349c200941b4da 100644 --- a/transcoder_all/layer_3_width_16k_l0_big/config.json +++ b/transcoder_all/layer_3_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 90, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_small/config.json b/transcoder_all/layer_3_width_16k_l0_small/config.json index 7b8785e182f3229d2eedb5a08d11fb7d979aa924..293d92a26678d08c83adb214ae75ee14792a37bc 100644 --- a/transcoder_all/layer_3_width_16k_l0_small/config.json +++ b/transcoder_all/layer_3_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_16k_l0_small_affine/config.json b/transcoder_all/layer_3_width_16k_l0_small_affine/config.json index 44c821fa4dcb1ec7fc9daffc3187b1a6fc6996ba..e922cee00731e6acb6dab6eab24e180dfb0c103d 100644 --- a/transcoder_all/layer_3_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_3_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_big_affine/config.json b/transcoder_all/layer_3_width_262k_l0_big_affine/config.json index 47c72ee1ba248febd2b461a6fafcccc618cf6e3a..1b88965ead2044112bc268353c5b823e04eb24d7 100644 --- a/transcoder_all/layer_3_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_3_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 90, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_small/config.json b/transcoder_all/layer_3_width_262k_l0_small/config.json index 693bd173af8113336cffa1910143c6b3f69334ae..8150b613311b02862811f730f366ff062f7fb45d 100644 --- a/transcoder_all/layer_3_width_262k_l0_small/config.json +++ b/transcoder_all/layer_3_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_3_width_262k_l0_small_affine/config.json b/transcoder_all/layer_3_width_262k_l0_small_affine/config.json index 2045ae57d9bfbd03cad865cb17766720f37b525d..e3838c195a31928192e21702b356e24146f49189 100644 --- a/transcoder_all/layer_3_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_3_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.3.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 15, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_small_affine/config.json b/transcoder_all/layer_4_width_16k_l0_small_affine/config.json index 7be4ec58fda15e34f31c7564c503ee586a4c9c83..9b51f19d9754cddf541a032dae0461239c426fdb 100644 --- a/transcoder_all/layer_4_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_4_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_big/config.json b/transcoder_all/layer_5_width_16k_l0_big/config.json index 09dda6e574c1d537fd570d17f7ebb82a7c94eef2..d2141aa3ef4073c4122556b8320de6753a805030 100644 --- a/transcoder_all/layer_5_width_16k_l0_big/config.json +++ b/transcoder_all/layer_5_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 110, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_big_affine/config.json b/transcoder_all/layer_5_width_16k_l0_big_affine/config.json index 2261d8d0a525bf6163a2a55a6646d3792ece5396..325b2463d5959b1b07770dbfe877c890566aeeb9 100644 --- a/transcoder_all/layer_5_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_5_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 110, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_16k_l0_small_affine/config.json b/transcoder_all/layer_5_width_16k_l0_small_affine/config.json index 4455a1472ec311214577a5501991bc225fa36e3e..c060218cb37e76ed187e89c5072ca424bf7d13c2 100644 --- a/transcoder_all/layer_5_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_5_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_5_width_262k_l0_big/config.json b/transcoder_all/layer_5_width_262k_l0_big/config.json index 7703397eb3a9bf112819394cacaed52e5099e343..e8047a199d42afb11d496e4974c157d958dd4be8 100644 --- a/transcoder_all/layer_5_width_262k_l0_big/config.json +++ b/transcoder_all/layer_5_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 110, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_6_width_262k_l0_big_affine/config.json b/transcoder_all/layer_6_width_262k_l0_big_affine/config.json index 14b68f87d8f69c03312bf087180a4deb868353ce..82295900e12ba55c1d885b3050a2cd588de76b8f 100644 --- a/transcoder_all/layer_6_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_6_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_big/config.json b/transcoder_all/layer_7_width_262k_l0_big/config.json index 3740df3afdf9bec13dffcb9427e4c3893c75529a..76c7137f2b0628259e69f4595bbe49c63d609f82 100644 --- a/transcoder_all/layer_7_width_262k_l0_big/config.json +++ b/transcoder_all/layer_7_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_small/config.json b/transcoder_all/layer_7_width_262k_l0_small/config.json index fb343ffd91fa7585fe4960f19af85dbd1a1eafd6..548672ede3d7c21dae97eb7517daf637ea1e7c15 100644 --- a/transcoder_all/layer_7_width_262k_l0_small/config.json +++ b/transcoder_all/layer_7_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_8_width_262k_l0_big/config.json b/transcoder_all/layer_8_width_262k_l0_big/config.json index 86b64c16f62cc53e32adfb7fe1cc3f7eb851aac6..90a31e3112c9bfabd3bd66290db05e5adb207600 100644 --- a/transcoder_all/layer_8_width_262k_l0_big/config.json +++ b/transcoder_all/layer_8_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.8.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_big_affine/config.json b/transcoder_all/layer_9_width_16k_l0_big_affine/config.json index 4b9667fcc447a3099ca0b1ba675649549df262a4..839a93200cb219e33661f1bc8d3ac7c061eba795 100644 --- a/transcoder_all/layer_9_width_16k_l0_big_affine/config.json +++ b/transcoder_all/layer_9_width_16k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_big/config.json b/transcoder_all/layer_9_width_262k_l0_big/config.json index 66374ea8e78050636add4c79034b389b0078f254..cb273763692046012eadf91bd3fc9d6ef258c100 100644 --- a/transcoder_all/layer_9_width_262k_l0_big/config.json +++ b/transcoder_all/layer_9_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_262k_l0_small_affine/config.json b/transcoder_all/layer_9_width_262k_l0_small_affine/config.json index d8e18e8d79d6ea5a843faa77f0d01b254da5549a..b4a0672d0eb3ca1c4e9c063ee7fc4c158fd801ca 100644 --- a/transcoder_all/layer_9_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_9_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file