diff --git a/attn_out/layer_12_width_16k_l0_big/config.json b/attn_out/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..90bfa81c65ba1cf5be11e5d08a6c379251129610 --- /dev/null +++ b/attn_out/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_12_width_16k_l0_medium/config.json b/attn_out/layer_12_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0dfb873da76c3af921d6033c5c77d8d3f66e0f7 --- /dev/null +++ b/attn_out/layer_12_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_12_width_16k_l0_small/config.json b/attn_out/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3b6e0d195b3f334100bbdb0838bb295d054faf48 --- /dev/null +++ b/attn_out/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_12_width_262k_l0_big/config.json b/attn_out/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..80bc18fe54c551a85cb3bee37e612ec7713a2876 --- /dev/null +++ b/attn_out/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_12_width_262k_l0_medium/config.json b/attn_out/layer_12_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8e1594526d80ac34ffd03e410494ff4c66d2d504 --- /dev/null +++ b/attn_out/layer_12_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_12_width_262k_l0_small/config.json b/attn_out/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9c59fcf1be0b6bd2b815919ead63b1a7b1137336 --- /dev/null +++ b/attn_out/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_12_width_65k_l0_big/config.json b/attn_out/layer_12_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..439bac5ac37e21476e77b82c9520fc4ad6b4f8c7 --- /dev/null +++ b/attn_out/layer_12_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_12_width_65k_l0_medium/config.json b/attn_out/layer_12_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c7288987ed02f2cd010457a1cca927b552e7231d --- /dev/null +++ b/attn_out/layer_12_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_12_width_65k_l0_small/config.json b/attn_out/layer_12_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ac500981ab1c22278eac1b9ec33ae9cfa338865c --- /dev/null +++ b/attn_out/layer_12_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_16k_l0_big/config.json b/attn_out/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b88edff7d083a0cffef9064659358a75076a94b1 --- /dev/null +++ b/attn_out/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_16k_l0_medium/config.json b/attn_out/layer_24_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32bc3dcfa1e41e2b2f850c6c080a88c87baf7277 --- /dev/null +++ b/attn_out/layer_24_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_16k_l0_small/config.json b/attn_out/layer_24_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..349fc0b43840bc964dc80a350b725ae93795e1a6 --- /dev/null +++ b/attn_out/layer_24_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_262k_l0_big/config.json b/attn_out/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8b105809d316fb412ba73a80d0f2ff719676d9b1 --- /dev/null +++ b/attn_out/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_262k_l0_medium/config.json b/attn_out/layer_24_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..768a9ced2fc0a68c398f7478791292845c2a36ab --- /dev/null +++ b/attn_out/layer_24_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_262k_l0_small/config.json b/attn_out/layer_24_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5851c804c67769f99288a6b5473d6eb16ac4ed33 --- /dev/null +++ b/attn_out/layer_24_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_65k_l0_big/config.json b/attn_out/layer_24_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ea7b7275cdaa3691939af7ee89e2746c3f22493d --- /dev/null +++ b/attn_out/layer_24_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_65k_l0_medium/config.json b/attn_out/layer_24_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..495f1fe3bb763f46531c0d2b6f2e32385676350e --- /dev/null +++ b/attn_out/layer_24_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_24_width_65k_l0_small/config.json b/attn_out/layer_24_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9d26e29b206480ec02bf928c2dc209b395be967b --- /dev/null +++ b/attn_out/layer_24_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_16k_l0_big/config.json b/attn_out/layer_31_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cb42ca5f4e8cd66d8ee8401d678cf1bc45ef6283 --- /dev/null +++ b/attn_out/layer_31_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_16k_l0_medium/config.json b/attn_out/layer_31_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4eb367185b67d4a9be9016326a86c798106be6eb --- /dev/null +++ b/attn_out/layer_31_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_16k_l0_small/config.json b/attn_out/layer_31_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..85e056efb8a07e55fc709ec173e84267d0ac77e1 --- /dev/null +++ b/attn_out/layer_31_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_262k_l0_big/config.json b/attn_out/layer_31_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..794284995506eb541ca3d9da25b4aa3b5138b604 --- /dev/null +++ b/attn_out/layer_31_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_262k_l0_medium/config.json b/attn_out/layer_31_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ea5dd10034367978b38ff152c6439750e06c3937 --- /dev/null +++ b/attn_out/layer_31_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_262k_l0_small/config.json b/attn_out/layer_31_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b4a3d28da5660f6a9b8a9133fec08d6f9e184dd9 --- /dev/null +++ b/attn_out/layer_31_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_65k_l0_big/config.json b/attn_out/layer_31_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..71f895289ff8b7356dc4a53af95c1b1032c78f47 --- /dev/null +++ b/attn_out/layer_31_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_65k_l0_medium/config.json b/attn_out/layer_31_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2b39b428ed82c32425a1b9064131d586850b3b44 --- /dev/null +++ b/attn_out/layer_31_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_31_width_65k_l0_small/config.json b/attn_out/layer_31_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0b6255fd8202f4dbc6518e2a521c0ad8fc19da26 --- /dev/null +++ b/attn_out/layer_31_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.31.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_16k_l0_big/config.json b/attn_out/layer_41_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..190a0c2dd318a94761044a2aeb17f58c415c352d --- /dev/null +++ b/attn_out/layer_41_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_16k_l0_medium/config.json b/attn_out/layer_41_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d95553a3ff81aa8ff099d3936ef92ac95ed3e068 --- /dev/null +++ b/attn_out/layer_41_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_16k_l0_small/config.json b/attn_out/layer_41_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7dcda3037c3980f1b3350bacf26d5e575e61fe17 --- /dev/null +++ b/attn_out/layer_41_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_262k_l0_big/config.json b/attn_out/layer_41_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ed4be4d63dfd8669ecaeb23ae7658d7af5844886 --- /dev/null +++ b/attn_out/layer_41_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_262k_l0_medium/config.json b/attn_out/layer_41_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd730a10cbb2627d804484071edefb107e61ad1d --- /dev/null +++ b/attn_out/layer_41_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_262k_l0_small/config.json b/attn_out/layer_41_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2aeab0170ad0e398b1b8844acbdebae89e0738c3 --- /dev/null +++ b/attn_out/layer_41_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_65k_l0_big/config.json b/attn_out/layer_41_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..345a5305ccb4050a83a81192733f88ec6b9eba8e --- /dev/null +++ b/attn_out/layer_41_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_65k_l0_medium/config.json b/attn_out/layer_41_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ea4fd2d6528f6dc3e5271025bdf11f2a9df0ede8 --- /dev/null +++ b/attn_out/layer_41_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out/layer_41_width_65k_l0_small/config.json b/attn_out/layer_41_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5e7dbf66d9853be71db25942cfad4fd6523a2ae0 --- /dev/null +++ b/attn_out/layer_41_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.41.self_attn.o_proj.input", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_big/config.json b/resid_post/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4b814655f188ff3b597391556d07d9b189691087 --- /dev/null +++ b/resid_post/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_medium/config.json b/resid_post/layer_12_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..05ae3ad6bd93f33c4de0c51c34a2aa421506c26c --- /dev/null +++ b/resid_post/layer_12_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_16k_l0_small/config.json b/resid_post/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b346eb4ecabd7bb1f7e062965ff14a16145b0959 --- /dev/null +++ b/resid_post/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_1m_l0_big/config.json b/resid_post/layer_12_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bbd3350fb7ccc7f655ab6ab687c585a9e68f5f0b --- /dev/null +++ b/resid_post/layer_12_width_1m_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_1m_l0_medium/config.json b/resid_post/layer_12_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e53f008d48553b6802fec675c6edf9fd9a331dce --- /dev/null +++ b/resid_post/layer_12_width_1m_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_1m_l0_small/config.json b/resid_post/layer_12_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..12d3b3d893846da4da327a2f716b53c749b3b6ca --- /dev/null +++ b/resid_post/layer_12_width_1m_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_big/config.json b/resid_post/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5489b61f897bbf7cf1ff924398856ac7d50ae19d --- /dev/null +++ b/resid_post/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_medium/config.json b/resid_post/layer_12_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f1b3328a2f790f83fbd7c89731fef038304acb96 --- /dev/null +++ b/resid_post/layer_12_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f1b3328a2f790f83fbd7c89731fef038304acb96 --- /dev/null +++ b/resid_post/layer_12_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_262k_l0_small/config.json b/resid_post/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6c15f43f3932864dd90c01aed514aec7d70804e7 --- /dev/null +++ b/resid_post/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_65k_l0_medium/config.json b/resid_post/layer_12_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..73862001e07abcff7030a9fcf7c64c2757feaaff --- /dev/null +++ b/resid_post/layer_12_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_12_width_65k_l0_small/config.json b/resid_post/layer_12_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..374d1d1142b46eb5426771c960884dcf94423c12 --- /dev/null +++ b/resid_post/layer_12_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_16k_l0_big/config.json b/resid_post/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7c2a51deb84d88d07e496a4c1eb8fa6a7bc7dd0c --- /dev/null +++ b/resid_post/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_1m_l0_big/config.json b/resid_post/layer_24_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fe3a0782f4c1bd779630d64fb9a760454b0928b8 --- /dev/null +++ b/resid_post/layer_24_width_1m_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_1m_l0_medium/config.json b/resid_post/layer_24_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5274f37d6640926051062ddf53e34a399d577df2 --- /dev/null +++ b/resid_post/layer_24_width_1m_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_1m_l0_small/config.json b/resid_post/layer_24_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fe3568b7c03e57bdff6ca940cbd752a94cc1c672 --- /dev/null +++ b/resid_post/layer_24_width_1m_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_262k_l0_big/config.json b/resid_post/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..149b79c0e271f4fab46173a058d4e31f2908cf62 --- /dev/null +++ b/resid_post/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_262k_l0_medium/config.json b/resid_post/layer_24_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b80f31573d838063ebceaf43ea525d9f3a762375 --- /dev/null +++ b/resid_post/layer_24_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_24_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b80f31573d838063ebceaf43ea525d9f3a762375 --- /dev/null +++ b/resid_post/layer_24_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_262k_l0_small/config.json b/resid_post/layer_24_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3c586069f7697542702cd59428224887c5eda351 --- /dev/null +++ b/resid_post/layer_24_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_65k_l0_big/config.json b/resid_post/layer_24_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..68284ed5e5424d7268fb6909a296d6534ce97a55 --- /dev/null +++ b/resid_post/layer_24_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_65k_l0_medium/config.json b/resid_post/layer_24_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5b14c9d3f5ab73c2aad0a6a7932933b09c2e2ebd --- /dev/null +++ b/resid_post/layer_24_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_24_width_65k_l0_small/config.json b/resid_post/layer_24_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6b3cc6ce893f9d097c4e5dd1282c3d4ef73e56a7 --- /dev/null +++ b/resid_post/layer_24_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_31_width_16k_l0_big/config.json b/resid_post/layer_31_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3d5c546ff9e8dfab5330f4494dad11160e9601a0 --- /dev/null +++ b/resid_post/layer_31_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_31_width_16k_l0_small/config.json b/resid_post/layer_31_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef18a64e8345801844017f4d02d75727b87df872 --- /dev/null +++ b/resid_post/layer_31_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_31_width_1m_l0_big/config.json b/resid_post/layer_31_width_1m_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c50275dc0b9ecd80f55e6c1c514b58ac9d00ae5d --- /dev/null +++ b/resid_post/layer_31_width_1m_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_31_width_1m_l0_medium/config.json b/resid_post/layer_31_width_1m_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..055508cc314c323c36e36df555f24b58adabfde5 --- /dev/null +++ b/resid_post/layer_31_width_1m_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_31_width_262k_l0_medium/config.json b/resid_post/layer_31_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b67421c62bd2b34ce93bedf0bf8f31ea270dca71 --- /dev/null +++ b/resid_post/layer_31_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_31_width_65k_l0_big/config.json b/resid_post/layer_31_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ade47fabad327bcc17b99c2bae13f60180b06d6 --- /dev/null +++ b/resid_post/layer_31_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_31_width_65k_l0_medium/config.json b/resid_post/layer_31_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..64d04f466517160644d8bd8a092d8b928b7fcafd --- /dev/null +++ b/resid_post/layer_31_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_31_width_65k_l0_small/config.json b/resid_post/layer_31_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa0c70ad0b4786dfad6ff6a17e00d400aa2d150 --- /dev/null +++ b/resid_post/layer_31_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_41_width_16k_l0_medium/config.json b/resid_post/layer_41_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7a9e4b3230295e4253006d2ff9a4685a1dc96642 --- /dev/null +++ b/resid_post/layer_41_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_41_width_1m_l0_small/config.json b/resid_post/layer_41_width_1m_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..202c704695e8118b60ee437367bc8b751615cb5d --- /dev/null +++ b/resid_post/layer_41_width_1m_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 1048576, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_41_width_262k_l0_big/config.json b/resid_post/layer_41_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bfae99082665b3b6150d8b0efe670c254702388c --- /dev/null +++ b/resid_post/layer_41_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_41_width_262k_l0_medium/config.json b/resid_post/layer_41_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f84a3182c09548a88011471e1b409a2b388fbc59 --- /dev/null +++ b/resid_post/layer_41_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_41_width_262k_l0_medium_seed_1/config.json b/resid_post/layer_41_width_262k_l0_medium_seed_1/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f84a3182c09548a88011471e1b409a2b388fbc59 --- /dev/null +++ b/resid_post/layer_41_width_262k_l0_medium_seed_1/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_41_width_65k_l0_big/config.json b/resid_post/layer_41_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f15d27e159e8ad00c84e7aaeb7a0f92265c4d6a3 --- /dev/null +++ b/resid_post/layer_41_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_41_width_65k_l0_medium/config.json b/resid_post/layer_41_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a9637b3e1dccbba67ef8deb423c555ea8829d28a --- /dev/null +++ b/resid_post/layer_41_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_41_width_65k_l0_small/config.json b/resid_post/layer_41_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec0d764fb5064d250d0c689d206f44435aca8dbf --- /dev/null +++ b/resid_post/layer_41_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 65536, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file