diff --git a/resid_post_all/layer_0_width_262k_l0_small/config.json b/resid_post_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..173a6ca294958bec4b4a56ee8db787fcbded5c72 --- /dev/null +++ b/resid_post_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_16k_l0_small/config.json b/resid_post_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5154af1c7b25a740404e74ccf80520ce01e4bc3b --- /dev/null +++ b/resid_post_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_262k_l0_small/config.json b/resid_post_all/layer_10_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1cad04898d3b11d754375db87b00eacd9edb4c88 --- /dev/null +++ b/resid_post_all/layer_10_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_16k_l0_big/config.json b/resid_post_all/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..31091eb5a38f51b8c998894155384d8ac122bfc9 --- /dev/null +++ b/resid_post_all/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 105, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_262k_l0_big/config.json b/resid_post_all/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dec5daeedd9eed714617c29fef51cceba4ac3cb9 --- /dev/null +++ b/resid_post_all/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 105, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_262k_l0_small/config.json b/resid_post_all/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6c15f43f3932864dd90c01aed514aec7d70804e7 --- /dev/null +++ b/resid_post_all/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_16k_l0_big/config.json b/resid_post_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2e255639ad3d3e00b822a751e6aeb78c39df740c --- /dev/null +++ b/resid_post_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_16k_l0_small/config.json b/resid_post_all/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..27783a0363b6ef1d7951213d58d4b736c1205c14 --- /dev/null +++ b/resid_post_all/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_262k_l0_big/config.json b/resid_post_all/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a286c86a12f0501f6ed62fc40a818722ced46d41 --- /dev/null +++ b/resid_post_all/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_262k_l0_small/config.json b/resid_post_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b2e3f6bb84ee4c5bc57abc189435b775904235a6 --- /dev/null +++ b/resid_post_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_16k_l0_big/config.json b/resid_post_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..db343b0ac995474c60afc1fff145e97f381b757c --- /dev/null +++ b/resid_post_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 112, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_16k_l0_small/config.json b/resid_post_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..09284c78fb9cda7c1aa0a51d099473201f94a698 --- /dev/null +++ b/resid_post_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_16k_l0_small/config.json b/resid_post_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f9176fcdf1ea3e69e9b9ddb6d946ab798346d6f5 --- /dev/null +++ b/resid_post_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_262k_l0_big/config.json b/resid_post_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..72e58b2dec41044e6b0d1c290243d72464b1dd50 --- /dev/null +++ b/resid_post_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_16k_l0_big/config.json b/resid_post_all/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..00e6a01306d57510ab07c7b81dbdc90b75a1e332 --- /dev/null +++ b/resid_post_all/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_262k_l0_big/config.json b/resid_post_all/layer_19_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..28cb5434e309571a0559d3e36b412a099bc23e1c --- /dev/null +++ b/resid_post_all/layer_19_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_19_width_262k_l0_small/config.json b/resid_post_all/layer_19_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..11b7ba9293b0412bdf847a2a3d598c656a08ea90 --- /dev/null +++ b/resid_post_all/layer_19_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.output", + "hf_hook_point_out": "model.layers.19.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_262k_l0_big/config.json b/resid_post_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bfef4be98a920ca7a45f470c854ad071d4e6bc97 --- /dev/null +++ b/resid_post_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 63, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_262k_l0_big/config.json b/resid_post_all/layer_20_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..149d6331b6dab69ddd3ef5f97cd738321a096a1d --- /dev/null +++ b/resid_post_all/layer_20_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_16k_l0_small/config.json b/resid_post_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d9efcc28a4aa9295656e8461b14d11c99f025aa0 --- /dev/null +++ b/resid_post_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_262k_l0_small/config.json b/resid_post_all/layer_21_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4e0efd06a436a52460ca63717af5455b257cd664 --- /dev/null +++ b/resid_post_all/layer_21_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_16k_l0_small/config.json b/resid_post_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..924919d7e3986a946ac1feda715fbc4f7f797ecd --- /dev/null +++ b/resid_post_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_262k_l0_big/config.json b/resid_post_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..532b65e98d169551c110137e817a1002c00de0df --- /dev/null +++ b/resid_post_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_16k_l0_small/config.json b/resid_post_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9c31c10c337f5eccb780c431f17c70a3d1b4f930 --- /dev/null +++ b/resid_post_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_262k_l0_big/config.json b/resid_post_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..77f1ae6258238a0dfb57d90db30d6ab9e2ab4ae4 --- /dev/null +++ b/resid_post_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_262k_l0_small/config.json b/resid_post_all/layer_23_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5b286f9d39e890cb49be606543a0a09202841b96 --- /dev/null +++ b/resid_post_all/layer_23_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_16k_l0_big/config.json b/resid_post_all/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1ab14bc4dbe0bbc36f4dc04ff1a2b0a1fc645297 --- /dev/null +++ b/resid_post_all/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_24_width_262k_l0_big/config.json b/resid_post_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7e0f1ee6a62bed08446677712fa8140c5487d498 --- /dev/null +++ b/resid_post_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.output", + "hf_hook_point_out": "model.layers.24.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_16k_l0_big/config.json b/resid_post_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6b7e71036085ada1f4de3bd57eaef352ade41366 --- /dev/null +++ b/resid_post_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_16k_l0_small/config.json b/resid_post_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e25080e4a7893c6dd6e384675bba99d4c3768c3a --- /dev/null +++ b/resid_post_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_262k_l0_small/config.json b/resid_post_all/layer_25_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2f6471a2d4451c3ab2aad2b87e8b0fdf5ae9948b --- /dev/null +++ b/resid_post_all/layer_25_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_26_width_16k_l0_small/config.json b/resid_post_all/layer_26_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c71f3fc4f947dc47dc19a78199d09e46a25d53a6 --- /dev/null +++ b/resid_post_all/layer_26_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.output", + "hf_hook_point_out": "model.layers.26.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_26_width_262k_l0_big/config.json b/resid_post_all/layer_26_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..be517800214852ae8d70db090681fddd619ea00f --- /dev/null +++ b/resid_post_all/layer_26_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.output", + "hf_hook_point_out": "model.layers.26.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_26_width_262k_l0_small/config.json b/resid_post_all/layer_26_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b1055e99cad652c41a6da98d2969d04e00e9ce66 --- /dev/null +++ b/resid_post_all/layer_26_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.output", + "hf_hook_point_out": "model.layers.26.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_27_width_262k_l0_big/config.json b/resid_post_all/layer_27_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..47e46fe3f9b837cde3daf1c55ad225bb6e9f0dc3 --- /dev/null +++ b/resid_post_all/layer_27_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.output", + "hf_hook_point_out": "model.layers.27.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_27_width_262k_l0_small/config.json b/resid_post_all/layer_27_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..17f6ca08dae27744ad471f3fc106bac6b59357c6 --- /dev/null +++ b/resid_post_all/layer_27_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.output", + "hf_hook_point_out": "model.layers.27.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_28_width_16k_l0_small/config.json b/resid_post_all/layer_28_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0f1ce77efcd8e76bce13c385723b7690f612464a --- /dev/null +++ b/resid_post_all/layer_28_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.output", + "hf_hook_point_out": "model.layers.28.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_31_width_16k_l0_big/config.json b/resid_post_all/layer_31_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ac7856e520d46cae373e4b2a669a6c3ef72dc360 --- /dev/null +++ b/resid_post_all/layer_31_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_32_width_262k_l0_small/config.json b/resid_post_all/layer_32_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f7cb24a164044cab9662f8e5ea1273ca0a2c8087 --- /dev/null +++ b/resid_post_all/layer_32_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.32.output", + "hf_hook_point_out": "model.layers.32.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_33_width_16k_l0_small/config.json b/resid_post_all/layer_33_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f651141a707611667d0bfe1c8fa065bdafac4557 --- /dev/null +++ b/resid_post_all/layer_33_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.output", + "hf_hook_point_out": "model.layers.33.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_33_width_262k_l0_big/config.json b/resid_post_all/layer_33_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8db2f9ea7ee36ebb6b036f72650e1a11a7964d66 --- /dev/null +++ b/resid_post_all/layer_33_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.output", + "hf_hook_point_out": "model.layers.33.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_33_width_262k_l0_small/config.json b/resid_post_all/layer_33_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b32dd795d02b41f3adfa4afa0a42592ee02387fe --- /dev/null +++ b/resid_post_all/layer_33_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.output", + "hf_hook_point_out": "model.layers.33.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_35_width_16k_l0_big/config.json b/resid_post_all/layer_35_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1cd308737427a58f08b9993c3c20e0a036fccec1 --- /dev/null +++ b/resid_post_all/layer_35_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.35.output", + "hf_hook_point_out": "model.layers.35.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_35_width_262k_l0_small/config.json b/resid_post_all/layer_35_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ce650eb989a490a42264db5b05f2575df2a96a0 --- /dev/null +++ b/resid_post_all/layer_35_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.35.output", + "hf_hook_point_out": "model.layers.35.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_36_width_262k_l0_small/config.json b/resid_post_all/layer_36_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6e132b4c19e5f0f8646429f48e668ccb223d7aed --- /dev/null +++ b/resid_post_all/layer_36_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.36.output", + "hf_hook_point_out": "model.layers.36.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_37_width_16k_l0_big/config.json b/resid_post_all/layer_37_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e621e63bce44e552952b2ccb3c62ef01ee9a9ebe --- /dev/null +++ b/resid_post_all/layer_37_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.output", + "hf_hook_point_out": "model.layers.37.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_37_width_262k_l0_big/config.json b/resid_post_all/layer_37_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..11b713ff5362c08027e6e0cfc0021a789bb97bc4 --- /dev/null +++ b/resid_post_all/layer_37_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.output", + "hf_hook_point_out": "model.layers.37.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_37_width_262k_l0_small/config.json b/resid_post_all/layer_37_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..25b8363e2d5138fd87bcd0e3a7dc59795c8cae29 --- /dev/null +++ b/resid_post_all/layer_37_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.output", + "hf_hook_point_out": "model.layers.37.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_38_width_262k_l0_big/config.json b/resid_post_all/layer_38_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fa067c0e4ec56ace7fb57d194ddb89cbb29b428b --- /dev/null +++ b/resid_post_all/layer_38_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.38.output", + "hf_hook_point_out": "model.layers.38.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_39_width_16k_l0_small/config.json b/resid_post_all/layer_39_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..39ced971941148fba5ddc2a75fc2401eb03333ed --- /dev/null +++ b/resid_post_all/layer_39_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.39.output", + "hf_hook_point_out": "model.layers.39.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_16k_l0_big/config.json b/resid_post_all/layer_3_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c48a9a1a1b08c80454bd63c046d7bf3cd725e0f3 --- /dev/null +++ b/resid_post_all/layer_3_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 71, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_16k_l0_small/config.json b/resid_post_all/layer_3_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..08187288ae650875f5a4ea6a23611331b404de02 --- /dev/null +++ b/resid_post_all/layer_3_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_262k_l0_big/config.json b/resid_post_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..29cb796433d312f43fc92353d4d0912ab13f13b4 --- /dev/null +++ b/resid_post_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 71, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_40_width_16k_l0_big/config.json b/resid_post_all/layer_40_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9bd980637ab70e3068855d0b12593d0c268d4742 --- /dev/null +++ b/resid_post_all/layer_40_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.40.output", + "hf_hook_point_out": "model.layers.40.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_40_width_262k_l0_small/config.json b/resid_post_all/layer_40_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ce0251d2e7b3896e0ad90043c70d474ee984ddc --- /dev/null +++ b/resid_post_all/layer_40_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.40.output", + "hf_hook_point_out": "model.layers.40.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_41_width_262k_l0_big/config.json b/resid_post_all/layer_41_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..13838ac3271306480f58bd7d4ad02f670361ba28 --- /dev/null +++ b/resid_post_all/layer_41_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.output", + "hf_hook_point_out": "model.layers.41.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_43_width_16k_l0_big/config.json b/resid_post_all/layer_43_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f3ba3c04c5c606b83ab840fd5ed9294c36acd66b --- /dev/null +++ b/resid_post_all/layer_43_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.output", + "hf_hook_point_out": "model.layers.43.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_43_width_16k_l0_small/config.json b/resid_post_all/layer_43_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..36a714b84075b1a03f85c9b56d1b5e397a4fb2b4 --- /dev/null +++ b/resid_post_all/layer_43_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.output", + "hf_hook_point_out": "model.layers.43.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_43_width_262k_l0_small/config.json b/resid_post_all/layer_43_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..360ec99787ed66325b58a671aa2fcb9164e35389 --- /dev/null +++ b/resid_post_all/layer_43_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.output", + "hf_hook_point_out": "model.layers.43.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_44_width_16k_l0_big/config.json b/resid_post_all/layer_44_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4b3ca09abee8b1a7b172265ea364db810d5cb139 --- /dev/null +++ b/resid_post_all/layer_44_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.44.output", + "hf_hook_point_out": "model.layers.44.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_44_width_262k_l0_big/config.json b/resid_post_all/layer_44_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..734da2993124b6fb1af63b262506238acbff3e24 --- /dev/null +++ b/resid_post_all/layer_44_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.44.output", + "hf_hook_point_out": "model.layers.44.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_44_width_262k_l0_small/config.json b/resid_post_all/layer_44_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4a7970348361af8555a0be5d190e7668b7a38367 --- /dev/null +++ b/resid_post_all/layer_44_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.44.output", + "hf_hook_point_out": "model.layers.44.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_45_width_262k_l0_big/config.json b/resid_post_all/layer_45_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a16f5dee7c929b9a0061b51c0cb00d60758076cb --- /dev/null +++ b/resid_post_all/layer_45_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.45.output", + "hf_hook_point_out": "model.layers.45.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_46_width_262k_l0_small/config.json b/resid_post_all/layer_46_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..18b5e8660d4b7a3a811d7ac5639b60a2f6932beb --- /dev/null +++ b/resid_post_all/layer_46_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.46.output", + "hf_hook_point_out": "model.layers.46.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_47_width_16k_l0_big/config.json b/resid_post_all/layer_47_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fedf47258362848594ace54f741066c1352fd815 --- /dev/null +++ b/resid_post_all/layer_47_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.47.output", + "hf_hook_point_out": "model.layers.47.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_47_width_16k_l0_small/config.json b/resid_post_all/layer_47_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..24b0fe8d668a6dc4fe9ecfc4c3cd55b0bfc36673 --- /dev/null +++ b/resid_post_all/layer_47_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.47.output", + "hf_hook_point_out": "model.layers.47.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_47_width_262k_l0_small/config.json b/resid_post_all/layer_47_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a5326fa3d88d91df8d7fbcd1813259a23d8f00f6 --- /dev/null +++ b/resid_post_all/layer_47_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.47.output", + "hf_hook_point_out": "model.layers.47.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_16k_l0_big/config.json b/resid_post_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..588f2bde66bf91227ca0a0c883b97157cbd63eb5 --- /dev/null +++ b/resid_post_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 75, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_262k_l0_small/config.json b/resid_post_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..75b15ebff4d8b7f893160898dff1e41a1c62d28a --- /dev/null +++ b/resid_post_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_16k_l0_small/config.json b/resid_post_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..70d03bba05e5b1ff6c9dc1c0bd1bb9b62d1281fe --- /dev/null +++ b/resid_post_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_262k_l0_big/config.json b/resid_post_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a7946c8af28b94714f1c8fbc8a81e8b351301cbe --- /dev/null +++ b/resid_post_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 78, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_262k_l0_small/config.json b/resid_post_all/layer_5_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3e9ecfc5ca0ad5fcd13983bfe74516d4b7b234d7 --- /dev/null +++ b/resid_post_all/layer_5_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_16k_l0_small/config.json b/resid_post_all/layer_6_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..218f33a4311295a075e239f9121b222753c9ff9c --- /dev/null +++ b/resid_post_all/layer_6_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_16k_l0_big/config.json b/resid_post_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4a918b303e0ae44739812952456e85642bfe05c5 --- /dev/null +++ b/resid_post_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 86, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_16k_l0_small/config.json b/resid_post_all/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bfd683674745ad7e16dbdda32edf38a383589e77 --- /dev/null +++ b/resid_post_all/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_16k_l0_small/config.json b/resid_post_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..25061164f957ed8ee967710c6679f2988a4a01bd --- /dev/null +++ b/resid_post_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_8_width_262k_l0_small/config.json b/resid_post_all/layer_8_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c319de4a15c388d7632680bf838a92420cb4182 --- /dev/null +++ b/resid_post_all/layer_8_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.output", + "hf_hook_point_out": "model.layers.8.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_262k_l0_big/config.json b/resid_post_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..835aca3e2e32d2e270f686b7bd03fb65a2c7de28 --- /dev/null +++ b/resid_post_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 93, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_9_width_262k_l0_small/config.json b/resid_post_all/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6625841723c2f46f61987b702edd5d03984765c4 --- /dev/null +++ b/resid_post_all/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file