diff --git a/attn_out/layer_12_width_16k_l0_big/config.json b/attn_out/layer_12_width_16k_l0_big/config.json index a1d1314c8e7d156b83b10b145fff3cc75f2dc725..7b6ed1761ba740c386cf0d3ec06ffa1fe9b95e7a 100644 --- a/attn_out/layer_12_width_16k_l0_big/config.json +++ b/attn_out/layer_12_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_12_width_16k_l0_medium/config.json b/attn_out/layer_12_width_16k_l0_medium/config.json index 9a0937948ce2ac5b85fd4486f44d5c57ba6f6d0a..ff574fb5249d8c6d3f1f6021af5862f472029ed3 100644 --- a/attn_out/layer_12_width_16k_l0_medium/config.json +++ b/attn_out/layer_12_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_12_width_16k_l0_small/config.json b/attn_out/layer_12_width_16k_l0_small/config.json index 451276b588a740b897000a6570654372204d4fe3..d74a9e062b481b9374504dbe0292c4d87be85f3c 100644 --- a/attn_out/layer_12_width_16k_l0_small/config.json +++ b/attn_out/layer_12_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_12_width_262k_l0_big/config.json b/attn_out/layer_12_width_262k_l0_big/config.json index 8d23d5aa25ee2f9b0ffe2fe9b403c944a52aeb05..4e84de99948617e0df3c4e75b1bd64b3b37241b9 100644 --- a/attn_out/layer_12_width_262k_l0_big/config.json +++ b/attn_out/layer_12_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_12_width_262k_l0_medium/config.json b/attn_out/layer_12_width_262k_l0_medium/config.json index f65adfd1f1d8b1e635fbfec39e6942993dea297a..5569684f69fca4570ab975189a357dcfc000594a 100644 --- a/attn_out/layer_12_width_262k_l0_medium/config.json +++ b/attn_out/layer_12_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_12_width_262k_l0_small/config.json b/attn_out/layer_12_width_262k_l0_small/config.json index 741fb3dc840a023a549d7ba4556198f2d475fa5d..40e71bf40da867d7ded6bca815bfb59f55c9bec1 100644 --- a/attn_out/layer_12_width_262k_l0_small/config.json +++ b/attn_out/layer_12_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_12_width_65k_l0_big/config.json b/attn_out/layer_12_width_65k_l0_big/config.json index 0702595f9c217b6009c22e61799b631f19de1f1b..b40c11aab8d77777eb0d1a0fc4ac853bd54439c4 100644 --- a/attn_out/layer_12_width_65k_l0_big/config.json +++ b/attn_out/layer_12_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_12_width_65k_l0_small/config.json b/attn_out/layer_12_width_65k_l0_small/config.json index 20239143cd593fa7d0da7aec788fa5c31adfe5af..cfa99bbfba30e51dce15810cc7442a113f472764 100644 --- a/attn_out/layer_12_width_65k_l0_small/config.json +++ b/attn_out/layer_12_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_16k_l0_big/config.json b/attn_out/layer_15_width_16k_l0_big/config.json index 6af3a12f0d3c1d987590b4fe2f262c6fd39c53e1..20be2b79a67b6a979ed82b27638dcc085cbdbdfb 100644 --- a/attn_out/layer_15_width_16k_l0_big/config.json +++ b/attn_out/layer_15_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_16k_l0_medium/config.json b/attn_out/layer_15_width_16k_l0_medium/config.json index 6f40db29c4ddbf409b291444766347841f9d94b3..94bce5eb4fe061f5db6681ae890fbc628e9cfbf9 100644 --- a/attn_out/layer_15_width_16k_l0_medium/config.json +++ b/attn_out/layer_15_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_16k_l0_small/config.json b/attn_out/layer_15_width_16k_l0_small/config.json index e0690184806bca6fe8d8b4596c4d85e29c3b5172..793cfdf76385fe8c3142bfb4434fcb0b9578d02b 100644 --- a/attn_out/layer_15_width_16k_l0_small/config.json +++ b/attn_out/layer_15_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_262k_l0_big/config.json b/attn_out/layer_15_width_262k_l0_big/config.json index 0275014349e3739d5189b98115f400b1899ca46b..ca0dd49c3d24f7d4159c0a504cc23902b744a041 100644 --- a/attn_out/layer_15_width_262k_l0_big/config.json +++ b/attn_out/layer_15_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_262k_l0_medium/config.json b/attn_out/layer_15_width_262k_l0_medium/config.json index 48de0de1377f404d3d0aac4126c3a1dd55083713..a04703aee3fab5fc51f6a6c672adbc04b66f9365 100644 --- a/attn_out/layer_15_width_262k_l0_medium/config.json +++ b/attn_out/layer_15_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_262k_l0_small/config.json b/attn_out/layer_15_width_262k_l0_small/config.json index b6455588e9365da4c520afd98452d761e870d6de..bbd5aff69551fbae4b8a72dd4c49fa70cc3dcc47 100644 --- a/attn_out/layer_15_width_262k_l0_small/config.json +++ b/attn_out/layer_15_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_65k_l0_big/config.json b/attn_out/layer_15_width_65k_l0_big/config.json index 03815f2929ea012bfe7195776b1726542c5e0c4b..22c01289a33e11bf23021cf3716fa9699b3f2a56 100644 --- a/attn_out/layer_15_width_65k_l0_big/config.json +++ b/attn_out/layer_15_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_65k_l0_medium/config.json b/attn_out/layer_15_width_65k_l0_medium/config.json index 6d4e51ae76fb940903e6ca7469db6e5648f9a7a1..5eebb227485cc7c47eddfb16885ecee6acc31a83 100644 --- a/attn_out/layer_15_width_65k_l0_medium/config.json +++ b/attn_out/layer_15_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_15_width_65k_l0_small/config.json b/attn_out/layer_15_width_65k_l0_small/config.json index fb353d6f64ca22f2fb78027e39e9c50351530e23..30fe5a3f701656e2d4e96ec52770653beccf78fc 100644 --- a/attn_out/layer_15_width_65k_l0_small/config.json +++ b/attn_out/layer_15_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.15.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_16k_l0_big/config.json b/attn_out/layer_5_width_16k_l0_big/config.json index 1a513ff62a9fc28deb8d06a9f828d70a5e3666fa..561f8bdfeabdf49e1bbb73730de07819283601ad 100644 --- a/attn_out/layer_5_width_16k_l0_big/config.json +++ b/attn_out/layer_5_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_16k_l0_medium/config.json b/attn_out/layer_5_width_16k_l0_medium/config.json index 7a9435765013190b37903c04961901e6b338ebe0..8508844c42b08c8e952772fe3be05925abdb85b1 100644 --- a/attn_out/layer_5_width_16k_l0_medium/config.json +++ b/attn_out/layer_5_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_16k_l0_small/config.json b/attn_out/layer_5_width_16k_l0_small/config.json index 489db5fbd214c1f1acb5cb5b80f7265e9ddc5ae9..d6b49b4da00bcb8bb8396bc0b875344cf9c8607f 100644 --- a/attn_out/layer_5_width_16k_l0_small/config.json +++ b/attn_out/layer_5_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_262k_l0_big/config.json b/attn_out/layer_5_width_262k_l0_big/config.json index cd81a60f9de0dfdbccfda07402199a713b7a18e7..2e19de451e9e0c0b5827fa2789cd60f4209cacad 100644 --- a/attn_out/layer_5_width_262k_l0_big/config.json +++ b/attn_out/layer_5_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_262k_l0_medium/config.json b/attn_out/layer_5_width_262k_l0_medium/config.json index 1992a10e52223a5ef92f3634358a76808a0fbe64..1fc51edd7048115cc47213b50dcfb097a1d068f8 100644 --- a/attn_out/layer_5_width_262k_l0_medium/config.json +++ b/attn_out/layer_5_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_262k_l0_small/config.json b/attn_out/layer_5_width_262k_l0_small/config.json index 9163edbfbf5100058efdde4052df2a9efb460c68..ff966ea7df9b9875c1fdce436e9220e29ec0349e 100644 --- a/attn_out/layer_5_width_262k_l0_small/config.json +++ b/attn_out/layer_5_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_65k_l0_big/config.json b/attn_out/layer_5_width_65k_l0_big/config.json index 44a3ca2ef70c2f49a60833b70de4c935f8de3a47..acf694e7a00c4337757de32888376fa2a5fe572e 100644 --- a/attn_out/layer_5_width_65k_l0_big/config.json +++ b/attn_out/layer_5_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_65k_l0_medium/config.json b/attn_out/layer_5_width_65k_l0_medium/config.json index 214242e749eb326d66be6042b84da0afb5a40c90..98aace13b5f5e528074d4d8c72d3267dadfb9633 100644 --- a/attn_out/layer_5_width_65k_l0_medium/config.json +++ b/attn_out/layer_5_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_5_width_65k_l0_small/config.json b/attn_out/layer_5_width_65k_l0_small/config.json index 5479ef0cf0da3808797e482d6d45d21bfa2b7a07..4403d44d29746fafb2aba8a20e86ea3e80b1d2f6 100644 --- a/attn_out/layer_5_width_65k_l0_small/config.json +++ b/attn_out/layer_5_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_16k_l0_big/config.json b/attn_out/layer_9_width_16k_l0_big/config.json index e2be54d160a43837f5d6e56d9939d7215223c8ec..6bb9794dff0912bdf42f434123b68d4783d3a45d 100644 --- a/attn_out/layer_9_width_16k_l0_big/config.json +++ b/attn_out/layer_9_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_16k_l0_medium/config.json b/attn_out/layer_9_width_16k_l0_medium/config.json index 015ca1dbc58b0f94d43c3e2b95451f4012647152..eac83c5b0d6e78f31298f3546d98948548d3ff81 100644 --- a/attn_out/layer_9_width_16k_l0_medium/config.json +++ b/attn_out/layer_9_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_16k_l0_small/config.json b/attn_out/layer_9_width_16k_l0_small/config.json index 8023ec7c5c43221f1db183a03387b368ee866e2b..2258328468803fc281c6272f8e44b7e726085350 100644 --- a/attn_out/layer_9_width_16k_l0_small/config.json +++ b/attn_out/layer_9_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_262k_l0_big/config.json b/attn_out/layer_9_width_262k_l0_big/config.json index 0ddbd27e7e7c3142a6bd9a90de19eb97eb85bb81..39f9d542153c7425fdbf0618fa93e6746404d36f 100644 --- a/attn_out/layer_9_width_262k_l0_big/config.json +++ b/attn_out/layer_9_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_262k_l0_medium/config.json b/attn_out/layer_9_width_262k_l0_medium/config.json index d3be8fbc5abe721a7372ef20099b8be93aa5490c..c496e1fa29307abede042cb7380f6f930ffa7e31 100644 --- a/attn_out/layer_9_width_262k_l0_medium/config.json +++ b/attn_out/layer_9_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_262k_l0_small/config.json b/attn_out/layer_9_width_262k_l0_small/config.json index d95c406aef894f2f53481ddfcb0215cdd65214ea..451cddde38ddfaa7596452d98623d62904edb479 100644 --- a/attn_out/layer_9_width_262k_l0_small/config.json +++ b/attn_out/layer_9_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_65k_l0_big/config.json b/attn_out/layer_9_width_65k_l0_big/config.json index a11cd3c007c6ab62fb5d0619bf40ce98b28d171d..14430247d31b35d6fbb41066c0ccafb6afa5c0c5 100644 --- a/attn_out/layer_9_width_65k_l0_big/config.json +++ b/attn_out/layer_9_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_65k_l0_medium/config.json b/attn_out/layer_9_width_65k_l0_medium/config.json index 61eb6d3a0f6fb652db181af89a08e592ca5f05df..44ddf16570da76a5b3772b328688160dd84a64e3 100644 --- a/attn_out/layer_9_width_65k_l0_medium/config.json +++ b/attn_out/layer_9_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out/layer_9_width_65k_l0_small/config.json b/attn_out/layer_9_width_65k_l0_small/config.json index 039857ea8cd451494ee768806f4bd37977d7cbc2..6412d7df51faaddb14a02b74e12f4533f8ad7feb 100644 --- a/attn_out/layer_9_width_65k_l0_small/config.json +++ b/attn_out/layer_9_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_12_width_16k_l0_small/config.json b/attn_out_all/layer_12_width_16k_l0_small/config.json index 451276b588a740b897000a6570654372204d4fe3..d74a9e062b481b9374504dbe0292c4d87be85f3c 100644 --- a/attn_out_all/layer_12_width_16k_l0_small/config.json +++ b/attn_out_all/layer_12_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_13_width_262k_l0_small/config.json b/attn_out_all/layer_13_width_262k_l0_small/config.json index 31a3e469eacd4011bffaa851be004b80e638e173..f78826365f5a8bb96353fdfe52661e5cde54da8b 100644 --- a/attn_out_all/layer_13_width_262k_l0_small/config.json +++ b/attn_out_all/layer_13_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/attn_out_all/layer_6_width_262k_l0_big/config.json b/attn_out_all/layer_6_width_262k_l0_big/config.json index cb8ba364caf862a161e5d73efb374bfbb2d101ac..ef71c772a44f319013a43ace0beabfbfe15b656b 100644 --- a/attn_out_all/layer_6_width_262k_l0_big/config.json +++ b/attn_out_all/layer_6_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/clt/width_524k_l0_big_affine/config.json b/clt/width_524k_l0_big_affine/config.json index c26ea295f9ae1260ee9de94c689d663e1feed190..42b7009bbbc10050142a5296c11a3e1548dd0912 100644 --- a/clt/width_524k_l0_big_affine/config.json +++ b/clt/width_524k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output", "width": 524160, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": true + "affine_connection": true, + "type": "clt" } \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_262k_l0_small/config.json b/mlp_out_all/layer_2_width_262k_l0_small/config.json index 2ad96c83bd032251588c8d0c407a9c1f81a938a9..6e2c168a5866d3560cfe08dd0199325a92c43de3 100644 --- a/mlp_out_all/layer_2_width_262k_l0_small/config.json +++ b/mlp_out_all/layer_2_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_big/config.json b/resid_post/layer_12_width_16k_l0_big/config.json index 3683132d85c4dcc3b3edcc011cba9911c893ff25..c891088a45e132d01f59902b60e84df00f2bbea6 100644 --- a/resid_post/layer_12_width_16k_l0_big/config.json +++ b/resid_post/layer_12_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_medium/config.json b/resid_post/layer_12_width_16k_l0_medium/config.json index 39ce4bba4f4323b0f7dafea47d5dae9daee908a6..0780ce0f399b7b8c9f43133db3dd92b6407b1940 100644 --- a/resid_post/layer_12_width_16k_l0_medium/config.json +++ b/resid_post/layer_12_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_small/config.json b/resid_post/layer_12_width_16k_l0_small/config.json index 44fb5bb602ef875ca5c62c99117148ed6f4d54ea..6baf209588813bc55abb5312bf096b68aebd1a86 100644 --- a/resid_post/layer_12_width_16k_l0_small/config.json +++ b/resid_post/layer_12_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_1m_l0_medium/config.json b/resid_post/layer_12_width_1m_l0_medium/config.json index 91c41dd0350bd96c399c93e60733d585d36c1d11..0980b789f112d728f6ffec5dc5401a98ad0a7279 100644 --- a/resid_post/layer_12_width_1m_l0_medium/config.json +++ b/resid_post/layer_12_width_1m_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_1m_l0_small/config.json b/resid_post/layer_12_width_1m_l0_small/config.json index 77a82f0821b7c2ce7c45a02c9562c86e4730e920..e96fea914f9ad7b3c72d052d511fe03c78558756 100644 --- a/resid_post/layer_12_width_1m_l0_small/config.json +++ b/resid_post/layer_12_width_1m_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_medium/config.json b/resid_post/layer_12_width_262k_l0_medium/config.json index 31dea821f488507d12a58ae1092b58c32945b1b9..73d205aae56c736e7e47f845e2bc5a566a6b0222 100644 --- a/resid_post/layer_12_width_262k_l0_medium/config.json +++ b/resid_post/layer_12_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json index 31dea821f488507d12a58ae1092b58c32945b1b9..73d205aae56c736e7e47f845e2bc5a566a6b0222 100644 --- a/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json +++ b/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_small/config.json b/resid_post/layer_12_width_262k_l0_small/config.json index edfb70326bb6c2a56bc361d33d0680b8d6a03322..65b2920dd4e8c4ca161c4db3986c3a849cccf576 100644 --- a/resid_post/layer_12_width_262k_l0_small/config.json +++ b/resid_post/layer_12_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_12_width_65k_l0_medium/config.json b/resid_post/layer_12_width_65k_l0_medium/config.json index 55aaeb80f6164df2e0bf3388b4f7f2bfdb609954..1ef70881a3bec7f1fa0c72a9004285c91eb4e95c 100644 --- a/resid_post/layer_12_width_65k_l0_medium/config.json +++ b/resid_post/layer_12_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.12.output", "hf_hook_point_out": "model.layers.12.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_16k_l0_big/config.json b/resid_post/layer_15_width_16k_l0_big/config.json index 4b2763b9f9d20ba119000f66a6be024d7f030fdd..5484ea196efc80945febb5ea59446964806f3dc2 100644 --- a/resid_post/layer_15_width_16k_l0_big/config.json +++ b/resid_post/layer_15_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_16k_l0_medium/config.json b/resid_post/layer_15_width_16k_l0_medium/config.json index 46dfdb44b3ad3d1ae90645edbd4265c20f88eef6..2c727768645250ee0b35bf2732c4db8220598f13 100644 --- a/resid_post/layer_15_width_16k_l0_medium/config.json +++ b/resid_post/layer_15_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_1m_l0_big/config.json b/resid_post/layer_15_width_1m_l0_big/config.json index 32cd957267ffa0a360ff95d4dd3619ab118c77e1..77eb975cb5796e145449f6b65afd97b3d71d3a2b 100644 --- a/resid_post/layer_15_width_1m_l0_big/config.json +++ b/resid_post/layer_15_width_1m_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_1m_l0_medium/config.json b/resid_post/layer_15_width_1m_l0_medium/config.json index 79682a319ea7f96583ff4f44653e6f5f04b5738e..f9659973bd9d102832c3287c23c09c520ef860fc 100644 --- a/resid_post/layer_15_width_1m_l0_medium/config.json +++ b/resid_post/layer_15_width_1m_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_1m_l0_small/config.json b/resid_post/layer_15_width_1m_l0_small/config.json index 7e42c0e103be9bc459511689a8270eb903dc3e6e..e03c60286444be9fa37611c86d776a455751aaa4 100644 --- a/resid_post/layer_15_width_1m_l0_small/config.json +++ b/resid_post/layer_15_width_1m_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_262k_l0_medium/config.json b/resid_post/layer_15_width_262k_l0_medium/config.json index 6d90861f88041245668e920153151e8a96e68546..efbac0c7b30077fadd0864ef9a3f6add379eb9ea 100644 --- a/resid_post/layer_15_width_262k_l0_medium/config.json +++ b/resid_post/layer_15_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_15_width_262k_l0_medium_seed_1/config.json index 6d90861f88041245668e920153151e8a96e68546..efbac0c7b30077fadd0864ef9a3f6add379eb9ea 100644 --- a/resid_post/layer_15_width_262k_l0_medium_seed_1/config.json +++ b/resid_post/layer_15_width_262k_l0_medium_seed_1/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_262k_l0_small/config.json b/resid_post/layer_15_width_262k_l0_small/config.json index 1784681b5c5383ee3e0ea37acd011e1bd5329dd9..853279b4bfc8739833f2d08687d0f7f556cd6019 100644 --- a/resid_post/layer_15_width_262k_l0_small/config.json +++ b/resid_post/layer_15_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_65k_l0_big/config.json b/resid_post/layer_15_width_65k_l0_big/config.json index 7ce74b7c83664554e1936e3f7018899b799f06ac..5ebb1ea06a37261d45e119100dc994d01c45b9a3 100644 --- a/resid_post/layer_15_width_65k_l0_big/config.json +++ b/resid_post/layer_15_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_65k_l0_medium/config.json b/resid_post/layer_15_width_65k_l0_medium/config.json index 17e599b82087479cb2d649d13ad228129e8d6d93..eb779e94fde371b695c4c1fd47c9d643463002d8 100644 --- a/resid_post/layer_15_width_65k_l0_medium/config.json +++ b/resid_post/layer_15_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_15_width_65k_l0_small/config.json b/resid_post/layer_15_width_65k_l0_small/config.json index cf79f9fc124917a09e61cf04329c0083fd04af38..18c52324d5daf92fc833be00b3b04b41d16b7faa 100644 --- a/resid_post/layer_15_width_65k_l0_small/config.json +++ b/resid_post/layer_15_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.output", "hf_hook_point_out": "model.layers.15.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_16k_l0_big/config.json b/resid_post/layer_5_width_16k_l0_big/config.json index 7b1510b6d8300833cb2c645048a0eadb5db3edd7..08cc9782a6b0d3ea2f68d6a203c38f335634a134 100644 --- a/resid_post/layer_5_width_16k_l0_big/config.json +++ b/resid_post/layer_5_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_16k_l0_medium/config.json b/resid_post/layer_5_width_16k_l0_medium/config.json index c65dbc3be13bdcf328cdbe83d17b28c2d9afe141..bacec507b0d68cfe12109083ec6ef1d62ab9d711 100644 --- a/resid_post/layer_5_width_16k_l0_medium/config.json +++ b/resid_post/layer_5_width_16k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_1m_l0_big/config.json b/resid_post/layer_5_width_1m_l0_big/config.json index bb8d3bc66ffc67619031fce85fc837b33e412ea9..607bbf379d53ce5be69213b603c0587a64b64600 100644 --- a/resid_post/layer_5_width_1m_l0_big/config.json +++ b/resid_post/layer_5_width_1m_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_1m_l0_medium/config.json b/resid_post/layer_5_width_1m_l0_medium/config.json index ee277683b775dcc690bf35526cd9b2483b4cf48b..f765f6973a4efaa0c3d5a641aa9e87bf32cf4646 100644 --- a/resid_post/layer_5_width_1m_l0_medium/config.json +++ b/resid_post/layer_5_width_1m_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_1m_l0_small/config.json b/resid_post/layer_5_width_1m_l0_small/config.json index 786e883eb0b6f1d9b773a985f5085a8641d4fbeb..60ae8948ca009ce592ecff04184f48722c54956e 100644 --- a/resid_post/layer_5_width_1m_l0_small/config.json +++ b/resid_post/layer_5_width_1m_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_262k_l0_medium/config.json b/resid_post/layer_5_width_262k_l0_medium/config.json index 915eb4d97029b71cb8595f94ef3d077f1aa934a4..115115126f63cb8acd296e8ab332de6ed98d8523 100644 --- a/resid_post/layer_5_width_262k_l0_medium/config.json +++ b/resid_post/layer_5_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_262k_l0_small/config.json b/resid_post/layer_5_width_262k_l0_small/config.json index 194d500026bbd9f11659abae4e55a7d88dc66121..6762e1ffc3d97e1bb04afb474b2fc36bf82d2d7f 100644 --- a/resid_post/layer_5_width_262k_l0_small/config.json +++ b/resid_post/layer_5_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_65k_l0_big/config.json b/resid_post/layer_5_width_65k_l0_big/config.json index 216093c699c970ce5ba8a2b985aaf7d4aacd3ff1..9a9fb5c3cfe974c044a213135f68f243105de5d7 100644 --- a/resid_post/layer_5_width_65k_l0_big/config.json +++ b/resid_post/layer_5_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 135, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_65k_l0_medium/config.json b/resid_post/layer_5_width_65k_l0_medium/config.json index 4ff3a63c6aa753f443316df70b6e3187e03fc9d9..b79576e65198097edc8f4c01c62e0d9f9bc70d4c 100644 --- a/resid_post/layer_5_width_65k_l0_medium/config.json +++ b/resid_post/layer_5_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_5_width_65k_l0_small/config.json b/resid_post/layer_5_width_65k_l0_small/config.json index 52c2877c1f5654bef212da837ac4decb320a13ca..2ac09f91daf9c66ff520be27e24e309c768bf014 100644 --- a/resid_post/layer_5_width_65k_l0_small/config.json +++ b/resid_post/layer_5_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.output", "hf_hook_point_out": "model.layers.5.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 18, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_16k_l0_big/config.json b/resid_post/layer_9_width_16k_l0_big/config.json index 39211eb607165857ba1b3b601997c3349ff2a470..6179ddd1e40885c315f56f196d6319a9ddd6592e 100644 --- a/resid_post/layer_9_width_16k_l0_big/config.json +++ b/resid_post/layer_9_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_big/config.json b/resid_post/layer_9_width_1m_l0_big/config.json index 08c77028d369bfc6e8e890dda14085097091fa86..a1bbd92f71fa6251704be7ae906b9fb89c8d279b 100644 --- a/resid_post/layer_9_width_1m_l0_big/config.json +++ b/resid_post/layer_9_width_1m_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_medium/config.json b/resid_post/layer_9_width_1m_l0_medium/config.json index 23cb7fc6b296dd8e08bcd7b92fb1eeb3928fa2ed..7bc969cf5e3d632ab80175d401fd4deaf0aad253 100644 --- a/resid_post/layer_9_width_1m_l0_medium/config.json +++ b/resid_post/layer_9_width_1m_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_1m_l0_small/config.json b/resid_post/layer_9_width_1m_l0_small/config.json index 9d9beae8b5747f01e00b88cd8fe485c32855951f..378ad96e08b2c47ef0001d773dce0c0bb49cf20c 100644 --- a/resid_post/layer_9_width_1m_l0_small/config.json +++ b/resid_post/layer_9_width_1m_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 1048576, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_big/config.json b/resid_post/layer_9_width_262k_l0_big/config.json index d98cac4a54524fb1f80fd80d5ad3d8aee3816541..b18438d330bf26f22afdd79d9aee480ce39fc4b0 100644 --- a/resid_post/layer_9_width_262k_l0_big/config.json +++ b/resid_post/layer_9_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_medium/config.json b/resid_post/layer_9_width_262k_l0_medium/config.json index c84bdf94f21d49231a23ee9189c7f5c2295f750f..acf62f17960d4d805e04b518dad43d442f128991 100644 --- a/resid_post/layer_9_width_262k_l0_medium/config.json +++ b/resid_post/layer_9_width_262k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json index c84bdf94f21d49231a23ee9189c7f5c2295f750f..acf62f17960d4d805e04b518dad43d442f128991 100644 --- a/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json +++ b/resid_post/layer_9_width_262k_l0_medium_seed_1/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_big/config.json b/resid_post/layer_9_width_65k_l0_big/config.json index 930acfef07df024f388b6287c15ec3fea6ee4a89..b41b7e21a43d8bc1022d5c392bad2d60a6a09bbb 100644 --- a/resid_post/layer_9_width_65k_l0_big/config.json +++ b/resid_post/layer_9_width_65k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 150, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_medium/config.json b/resid_post/layer_9_width_65k_l0_medium/config.json index 05417ed7572f02df2718f11b5eaecd671a32f990..b3448eec256ed91cd1d644d4e39c48785cb59a18 100644 --- a/resid_post/layer_9_width_65k_l0_medium/config.json +++ b/resid_post/layer_9_width_65k_l0_medium/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_small/config.json b/resid_post/layer_9_width_65k_l0_small/config.json index 49972ad186969651da139883e2361b58a522823e..a34dfc07a3abef717059b0f4391393560c5703d2 100644 --- a/resid_post/layer_9_width_65k_l0_small/config.json +++ b/resid_post/layer_9_width_65k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.output", "hf_hook_point_out": "model.layers.9.output", "width": 65536, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "sae" } \ No newline at end of file diff --git a/transcoder/layer_5_width_262k_l0_medium_affine/config.json b/transcoder/layer_5_width_262k_l0_medium_affine/config.json index c9d0ea15cdae62926fe8ffef075f78d0d9e5cb1e..db5dcb159f2cb265c574385f59a20c00e496f2cc 100644 --- a/transcoder/layer_5_width_262k_l0_medium_affine/config.json +++ b/transcoder/layer_5_width_262k_l0_medium_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.5.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 55, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_16k_l0_small/config.json b/transcoder_all/layer_0_width_16k_l0_small/config.json index 8a50a6964867dd0d99d0268d0a352fa5780cf17d..4cb2f011e3e62442e63b5c01aa61dc901281a65e 100644 --- a/transcoder_all/layer_0_width_16k_l0_small/config.json +++ b/transcoder_all/layer_0_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 10, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_0_width_262k_l0_big_affine/config.json b/transcoder_all/layer_0_width_262k_l0_big_affine/config.json index c61b4e0265ea7c886da3848f3b38affce4cae5b0..f03e75d64a8dd4fe45f2fbcd5c0fbf4e36c7ac95 100644 --- a/transcoder_all/layer_0_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_0_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.0.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 60, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_10_width_16k_l0_big/config.json b/transcoder_all/layer_10_width_16k_l0_big/config.json index ebb20520fb3c46e530456245ad47a5d943196983..dee06d6bd9cc2aabad486cac6320a9b05143418d 100644 --- a/transcoder_all/layer_10_width_16k_l0_big/config.json +++ b/transcoder_all/layer_10_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.10.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_11_width_262k_l0_small/config.json b/transcoder_all/layer_11_width_262k_l0_small/config.json index 6002baeac7f0af73750d97b4107120583ec7902f..22d0d6b404ae95c9222c36884286e33a312c95bc 100644 --- a/transcoder_all/layer_11_width_262k_l0_small/config.json +++ b/transcoder_all/layer_11_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.11.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_13_width_16k_l0_big/config.json b/transcoder_all/layer_13_width_16k_l0_big/config.json index 8ad972a9d5d48eadfba8266f43f52b35d5681d78..a21163987a85c3a8f2cc57b5aff53c70f746618a 100644 --- a/transcoder_all/layer_13_width_16k_l0_big/config.json +++ b/transcoder_all/layer_13_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.13.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_15_width_262k_l0_big_affine/config.json b/transcoder_all/layer_15_width_262k_l0_big_affine/config.json index 1d4b82f47cd72259203f5e9587ab1fbe54fb481f..e6d42df44482fc6a3d7a6c3038f45a463a3cef30 100644 --- a/transcoder_all/layer_15_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_15_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.15.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_16k_l0_big/config.json b/transcoder_all/layer_17_width_16k_l0_big/config.json index 6b7c0a04ae3c37424c7e6e1fe8e6d609b1f15a4a..9850f422e35460c6cb52a3b5478416a6c4494a8b 100644 --- a/transcoder_all/layer_17_width_16k_l0_big/config.json +++ b/transcoder_all/layer_17_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_17_width_262k_l0_small_affine/config.json b/transcoder_all/layer_17_width_262k_l0_small_affine/config.json index 96aaf0ab21c8e07be8e6c53079db95c3c1549009..918de468f89136b48f1ab38a6bd4cb33b72ceb05 100644 --- a/transcoder_all/layer_17_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_17_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.17.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_1_width_262k_l0_small_affine/config.json b/transcoder_all/layer_1_width_262k_l0_small_affine/config.json index 77c0db3d07fcf6264ed0b00e3feba33186e2d9da..8a7d3ee9da4e0ef813e33d82f34ab1a9c3c6e934 100644 --- a/transcoder_all/layer_1_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_1_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.1.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 11, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_big/config.json b/transcoder_all/layer_2_width_262k_l0_big/config.json index 2cac582fa63a4bcfa44182778af8499588f4222c..d72a54d06562d3a5cda2b618f7b446796d0b1089 100644 --- a/transcoder_all/layer_2_width_262k_l0_big/config.json +++ b/transcoder_all/layer_2_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 80, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_2_width_262k_l0_small/config.json b/transcoder_all/layer_2_width_262k_l0_small/config.json index b62a87f01c2dbb1be7117ebd7c81eef1e2cfac3d..f0b4b8e113a2dea36dfcca71a81cf713b4adb7a8 100644 --- a/transcoder_all/layer_2_width_262k_l0_small/config.json +++ b/transcoder_all/layer_2_width_262k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.2.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 13, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_16k_l0_big/config.json b/transcoder_all/layer_4_width_16k_l0_big/config.json index 94ce2b67457dfafa5709afadf2b825a06f76a75f..a091a9d1ab659031f781d2dfb8b0744891eb206b 100644 --- a/transcoder_all/layer_4_width_16k_l0_big/config.json +++ b/transcoder_all/layer_4_width_16k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 100, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_big/config.json b/transcoder_all/layer_4_width_262k_l0_big/config.json index f1d6945875f713b1c644dab5f3a72afd2ef30f57..a7fa98c97c09b105a62b08227345fc698f5a5274 100644 --- a/transcoder_all/layer_4_width_262k_l0_big/config.json +++ b/transcoder_all/layer_4_width_262k_l0_big/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 100, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_4_width_262k_l0_small_affine/config.json b/transcoder_all/layer_4_width_262k_l0_small_affine/config.json index 1a3460dc093827776e0ce13f10727dec4c0552cf..4d5c3c8914a7ae0b4b28cc41897352bab359095f 100644 --- a/transcoder_all/layer_4_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_4_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.4.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 16, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_16k_l0_small_affine/config.json b/transcoder_all/layer_7_width_16k_l0_small_affine/config.json index 7cec02f803c70771951243e8bc6923860e0f0b72..068e73402ff1a5347155b64f65d26fec52e6c220 100644 --- a/transcoder_all/layer_7_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_7_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_big_affine/config.json b/transcoder_all/layer_7_width_262k_l0_big_affine/config.json index 442dfdae04f2ab648e8e304d95803c889b0ddef3..d6bc65fe9e140f07d1d7c3909f363bade952c18b 100644 --- a/transcoder_all/layer_7_width_262k_l0_big_affine/config.json +++ b/transcoder_all/layer_7_width_262k_l0_big_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 120, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_7_width_262k_l0_small_affine/config.json b/transcoder_all/layer_7_width_262k_l0_small_affine/config.json index b0f6302935058034ec8e5b04be9e3d566043a404..932642a0d7d4202e6cd33836e9c4b0d20fc8ee97 100644 --- a/transcoder_all/layer_7_width_262k_l0_small_affine/config.json +++ b/transcoder_all/layer_7_width_262k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.7.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", "width": 262144, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_small/config.json b/transcoder_all/layer_9_width_16k_l0_small/config.json index 84836a0a310a8691331512b48d1bc6f689925012..38b3530a54d339fe15b0dec6f196b5f6e3d65083 100644 --- a/transcoder_all/layer_9_width_16k_l0_small/config.json +++ b/transcoder_all/layer_9_width_16k_l0_small/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": false + "affine_connection": false, + "type": "transcoder" } \ No newline at end of file diff --git a/transcoder_all/layer_9_width_16k_l0_small_affine/config.json b/transcoder_all/layer_9_width_16k_l0_small_affine/config.json index 4ea0330788c25238d6244aa55b4c0a08f9389aab..d9ff66d963f58c4d14e1a73cf56759bea0a4f486 100644 --- a/transcoder_all/layer_9_width_16k_l0_small_affine/config.json +++ b/transcoder_all/layer_9_width_16k_l0_small_affine/config.json @@ -2,8 +2,9 @@ "hf_hook_point_in": "model.layers.9.pre_feedforward_layernorm.output", "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", "width": 16384, - "model_name": "gemma-v3-270m-it", + "model_name": "google/gemma-3-270m-it", "architecture": "jump_relu", "l0": 20, - "affine_connection": true + "affine_connection": true, + "type": "transcoder" } \ No newline at end of file