diff --git a/mlp_out_all/layer_0_width_262k_l0_small/config.json b/mlp_out_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cd530668308b13495bce20ece37b6c5be48c0cbd --- /dev/null +++ b/mlp_out_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_16k_l0_small/config.json b/mlp_out_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..021aa5f75cde3381e02e5bb89f943e4ed622f1cd --- /dev/null +++ b/mlp_out_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_262k_l0_small/config.json b/mlp_out_all/layer_10_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a7cda58a5cf51c5b954ef920c31b4c7a05c97ab0 --- /dev/null +++ b/mlp_out_all/layer_10_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_12_width_16k_l0_big/config.json b/mlp_out_all/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8f88fc5e4776e0701f9fbfbf7de0550d7faf5ff4 --- /dev/null +++ b/mlp_out_all/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 105, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_262k_l0_small/config.json b/mlp_out_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..937a881fa28ac950b9a9efb695535b7ba2fbcaf9 --- /dev/null +++ b/mlp_out_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_16k_l0_big/config.json b/mlp_out_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9036d59c1630b4318206950214a291d8f38889f7 --- /dev/null +++ b/mlp_out_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 112, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_16k_l0_small/config.json b/mlp_out_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5b9ed539c1992451447021a460a6bd2fc797eef3 --- /dev/null +++ b/mlp_out_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_16k_l0_small/config.json b/mlp_out_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1b1d1e786c5fc8b7d3702812e0aea22152e11870 --- /dev/null +++ b/mlp_out_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_19_width_262k_l0_small/config.json b/mlp_out_all/layer_19_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..89347d1a87b468a875cd70f6380f8ebb2f7e6c11 --- /dev/null +++ b/mlp_out_all/layer_19_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_1_width_262k_l0_big/config.json b/mlp_out_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..44389cf4e0acd12f44c3d7c3b6ab428690868c5f --- /dev/null +++ b/mlp_out_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.1.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.1.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 63, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_21_width_16k_l0_small/config.json b/mlp_out_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..66118a4a6d3339f9bad23993283a72850ede758d --- /dev/null +++ b/mlp_out_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_21_width_262k_l0_small/config.json b/mlp_out_all/layer_21_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..dd3a967d6981ecbd7b71fba25fb738dc3f82eaee --- /dev/null +++ b/mlp_out_all/layer_21_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_16k_l0_small/config.json b/mlp_out_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..92b720997f8f31607132afb2d14b5321f91500cc --- /dev/null +++ b/mlp_out_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_262k_l0_big/config.json b/mlp_out_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6d96881dca288562535d9a3d9f9383ea29385bba --- /dev/null +++ b/mlp_out_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_262k_l0_big/config.json b/mlp_out_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a32e3c70a2a3f2c324121b23e08a15e68b579080 --- /dev/null +++ b/mlp_out_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_262k_l0_small/config.json b/mlp_out_all/layer_23_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b87da90d75fd3c40cac56bd00c9964a4351e2751 --- /dev/null +++ b/mlp_out_all/layer_23_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_24_width_262k_l0_big/config.json b/mlp_out_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..82ac7eda6b47d4f3bf399f3687b03d5aad84a947 --- /dev/null +++ b/mlp_out_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_16k_l0_big/config.json b/mlp_out_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cc26f3a919b93ab95494ed4c55908eb18984c3e7 --- /dev/null +++ b/mlp_out_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_16k_l0_small/config.json b/mlp_out_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4c35887be797eb985af6c385d5a61e82722fdd6f --- /dev/null +++ b/mlp_out_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_262k_l0_small/config.json b/mlp_out_all/layer_25_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5ca8e25929f87fa02c65bb4a989b7c3e38b7cc5a --- /dev/null +++ b/mlp_out_all/layer_25_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_26_width_16k_l0_small/config.json b/mlp_out_all/layer_26_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e3c12127c00c0bf9898a694349e3258f97c2da67 --- /dev/null +++ b/mlp_out_all/layer_26_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_27_width_262k_l0_big/config.json b/mlp_out_all/layer_27_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..70eccb7a35e8f0a44ae6213669e34f04894c53a7 --- /dev/null +++ b/mlp_out_all/layer_27_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_27_width_262k_l0_small/config.json b/mlp_out_all/layer_27_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..406a3b98797d0ede3c8c8343405ab44882e486cc --- /dev/null +++ b/mlp_out_all/layer_27_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_28_width_16k_l0_small/config.json b/mlp_out_all/layer_28_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1743a23ba4cf507d82b5c986a3280f2605d9e80f --- /dev/null +++ b/mlp_out_all/layer_28_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_31_width_16k_l0_big/config.json b/mlp_out_all/layer_31_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f7b1fd1d21e08f1477141a42c23fc77206e1acda --- /dev/null +++ b/mlp_out_all/layer_31_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_32_width_262k_l0_small/config.json b/mlp_out_all/layer_32_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df3b9ea3fa433f7fe00e8649ed3df7e685290b03 --- /dev/null +++ b/mlp_out_all/layer_32_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.32.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.32.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_33_width_16k_l0_small/config.json b/mlp_out_all/layer_33_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..50f106f12f0a764bdcc3c0f51dec819bd6b381e5 --- /dev/null +++ b/mlp_out_all/layer_33_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_33_width_262k_l0_big/config.json b/mlp_out_all/layer_33_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3fca4a6a02448fdae915c605c3fac38a20fac0b5 --- /dev/null +++ b/mlp_out_all/layer_33_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_35_width_16k_l0_big/config.json b/mlp_out_all/layer_35_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0ef82df953adb50d9118356370156aa45f7ac815 --- /dev/null +++ b/mlp_out_all/layer_35_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.35.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_35_width_262k_l0_small/config.json b/mlp_out_all/layer_35_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4aeb9b8f5040d9424ac5b9b6185231a4f441b386 --- /dev/null +++ b/mlp_out_all/layer_35_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.35.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_36_width_262k_l0_small/config.json b/mlp_out_all/layer_36_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5f145b14837c613aa28c883012faf7ee2d4c073f --- /dev/null +++ b/mlp_out_all/layer_36_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.36.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_37_width_16k_l0_big/config.json b/mlp_out_all/layer_37_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..118d6916528ec766f42d99ca2aae13eafadcba0b --- /dev/null +++ b/mlp_out_all/layer_37_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_37_width_262k_l0_small/config.json b/mlp_out_all/layer_37_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a67bbf1d4aa5539dd4ec8fdd57879f63a62f994 --- /dev/null +++ b/mlp_out_all/layer_37_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_38_width_262k_l0_big/config.json b/mlp_out_all/layer_38_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fd73c9b237985827bcb19e9315cfae69448f5e60 --- /dev/null +++ b/mlp_out_all/layer_38_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.38.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_39_width_16k_l0_small/config.json b/mlp_out_all/layer_39_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4ba327a3e9e425a4a977223f04d3606d0d61f4bc --- /dev/null +++ b/mlp_out_all/layer_39_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.39.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_16k_l0_big/config.json b/mlp_out_all/layer_3_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d4a316440478df5dbc07d5e860cdb5b36b348cca --- /dev/null +++ b/mlp_out_all/layer_3_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 71, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_16k_l0_small/config.json b/mlp_out_all/layer_3_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..428ef41f67777030df1e2ea531f2b6e9622964ec --- /dev/null +++ b/mlp_out_all/layer_3_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_262k_l0_big/config.json b/mlp_out_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9dd052f523fae7eacc37fc73395cfb774da74799 --- /dev/null +++ b/mlp_out_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 71, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_40_width_16k_l0_big/config.json b/mlp_out_all/layer_40_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7f163dacf0d0ae5e5ccbc107a95a05947a9717a0 --- /dev/null +++ b/mlp_out_all/layer_40_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.40.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_40_width_262k_l0_small/config.json b/mlp_out_all/layer_40_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8f75e243a6e7a92fce77c36e57dc5dbed0745193 --- /dev/null +++ b/mlp_out_all/layer_40_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.40.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_41_width_262k_l0_big/config.json b/mlp_out_all/layer_41_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bf1a09615f15a327fa487f723808757001d5c66e --- /dev/null +++ b/mlp_out_all/layer_41_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_43_width_16k_l0_big/config.json b/mlp_out_all/layer_43_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..221b3a5b4cf9eeb5f1486c5bf5c278c303454da6 --- /dev/null +++ b/mlp_out_all/layer_43_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_43_width_16k_l0_small/config.json b/mlp_out_all/layer_43_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df461627f6f6149253c703bba7d0262bcf4d48f0 --- /dev/null +++ b/mlp_out_all/layer_43_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_43_width_262k_l0_small/config.json b/mlp_out_all/layer_43_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6f4b28935eb790406175401251b75aa25d6365ed --- /dev/null +++ b/mlp_out_all/layer_43_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_44_width_16k_l0_big/config.json b/mlp_out_all/layer_44_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7042b56ac740c22cee55c7cf2c43948c92638b70 --- /dev/null +++ b/mlp_out_all/layer_44_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.44.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_44_width_262k_l0_big/config.json b/mlp_out_all/layer_44_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..37da92ee3a47affc66d8661177d2df1708edc4fd --- /dev/null +++ b/mlp_out_all/layer_44_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.44.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_44_width_262k_l0_small/config.json b/mlp_out_all/layer_44_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b169bd86e8b7770473e00f7a7c06d852abfff7c6 --- /dev/null +++ b/mlp_out_all/layer_44_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.44.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.44.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_45_width_262k_l0_big/config.json b/mlp_out_all/layer_45_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..539f8278cf0ef431ddd1f392353bd2869b991040 --- /dev/null +++ b/mlp_out_all/layer_45_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.45.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_46_width_262k_l0_small/config.json b/mlp_out_all/layer_46_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1305c4b621cfaa36af9aaf026a96d6ea31c9f597 --- /dev/null +++ b/mlp_out_all/layer_46_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.46.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.46.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_47_width_16k_l0_small/config.json b/mlp_out_all/layer_47_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..02d8c5e137e5ffad25d0fe46481905dcea54ed8e --- /dev/null +++ b/mlp_out_all/layer_47_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.47.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_47_width_262k_l0_small/config.json b/mlp_out_all/layer_47_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f03643d21ed4bd75b8709b03dfddc7058e3b3618 --- /dev/null +++ b/mlp_out_all/layer_47_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.47.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_16k_l0_big/config.json b/mlp_out_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3162877bce072efd4855c63891a1d26339060fd9 --- /dev/null +++ b/mlp_out_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 75, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_262k_l0_small/config.json b/mlp_out_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c4fd73be7d2c5a0b2deb5b587b5ff7cd2a192c67 --- /dev/null +++ b/mlp_out_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_16k_l0_small/config.json b/mlp_out_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2e20bb495fd338e464515d76f66f4bc54a8a7278 --- /dev/null +++ b/mlp_out_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_262k_l0_big/config.json b/mlp_out_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a7957cbf674db3e25453595e13a845c6a28e32f6 --- /dev/null +++ b/mlp_out_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 78, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_16k_l0_small/config.json b/mlp_out_all/layer_6_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..07a3004b54aca8f535b56466d8baaf5fdb6a3b62 --- /dev/null +++ b/mlp_out_all/layer_6_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_big/config.json b/mlp_out_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5417267a1ec0a22e7bd5d138f6dcd5e6c5047ebd --- /dev/null +++ b/mlp_out_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 86, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_small/config.json b/mlp_out_all/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7de585981c6da313bdd15e7608a0534159d49160 --- /dev/null +++ b/mlp_out_all/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_16k_l0_small/config.json b/mlp_out_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d6bc71236a4d57dc8cc2c31e377693363d4ade2c --- /dev/null +++ b/mlp_out_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_262k_l0_small/config.json b/mlp_out_all/layer_8_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..694387d2ecde9fdef97f60f696a0a857c20bd225 --- /dev/null +++ b/mlp_out_all/layer_8_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_262k_l0_big/config.json b/mlp_out_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0acd882df72fc9d5e6a044d685d393796872a27d --- /dev/null +++ b/mlp_out_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-pt", + "architecture": "jump_relu", + "l0": 93, + "affine_connection": false +} \ No newline at end of file