diff --git a/mlp_out_all/layer_0_width_16k_l0_small/config.json b/mlp_out_all/layer_0_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..62341447359b14081616db4a0ac8009ebba58402 --- /dev/null +++ b/mlp_out_all/layer_0_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_262k_l0_small/config.json b/mlp_out_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f2de7d44d3d8868b114be884b1772c7e6a40a3d5 --- /dev/null +++ b/mlp_out_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_11_width_16k_l0_small/config.json b/mlp_out_all/layer_11_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0bbe6efada2881eca2d419088cb8b823dd82cc22 --- /dev/null +++ b/mlp_out_all/layer_11_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.11.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.11.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_16k_l0_big/config.json b/mlp_out_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8a3496e6eb7f442fcbf5977bf16ebcbfcd2a64d6 --- /dev/null +++ b/mlp_out_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 97, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_262k_l0_big/config.json b/mlp_out_all/layer_14_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..91d1125fb30235328d51677b42f697f5a0a7f6c1 --- /dev/null +++ b/mlp_out_all/layer_14_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 100, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_16k_l0_small/config.json b/mlp_out_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..23ec24f52b28843e91675780642d57d768cf3e50 --- /dev/null +++ b/mlp_out_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_262k_l0_big/config.json b/mlp_out_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..31c5f0f01004455589f14d290709b1459d2e80bc --- /dev/null +++ b/mlp_out_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 106, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_big/config.json b/mlp_out_all/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..23341a82fc3cb256406500121d141ad4788b7a6f --- /dev/null +++ b/mlp_out_all/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 109, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_small/config.json b/mlp_out_all/layer_17_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec82360654282aadb9f1622a6d3018f1f94ca71e --- /dev/null +++ b/mlp_out_all/layer_17_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_18_width_262k_l0_big/config.json b/mlp_out_all/layer_18_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..80a284c99ac349f3c21f5b5e97ce4bfdaaee13cb --- /dev/null +++ b/mlp_out_all/layer_18_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.18.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 112, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_18_width_262k_l0_small/config.json b/mlp_out_all/layer_18_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32deab0558c721f9483bad5dad1858174232ed8e --- /dev/null +++ b/mlp_out_all/layer_18_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.18.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_19_width_16k_l0_small/config.json b/mlp_out_all/layer_19_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a327bb80901033a1b32044b2c28e17f0b82ac199 --- /dev/null +++ b/mlp_out_all/layer_19_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.19.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_21_width_16k_l0_small/config.json b/mlp_out_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fd20ec9bb3dc4540861aea3a5ea59260c4ebfa49 --- /dev/null +++ b/mlp_out_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_16k_l0_small/config.json b/mlp_out_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..009866570cf1473b2549d2670a30e51e4f4df9e8 --- /dev/null +++ b/mlp_out_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_16k_l0_big/config.json b/mlp_out_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..29ccbb17deb19873efe5029eef4675b2bd6d25fc --- /dev/null +++ b/mlp_out_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_16k_l0_small/config.json b/mlp_out_all/layer_25_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fa7e74488e0022e74dc2a1a7f7dbab2345356420 --- /dev/null +++ b/mlp_out_all/layer_25_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_262k_l0_big/config.json b/mlp_out_all/layer_25_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f8cf860d4fbe22e918edff7e503e1bd088cb8d6c --- /dev/null +++ b/mlp_out_all/layer_25_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_26_width_16k_l0_small/config.json b/mlp_out_all/layer_26_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3987cbd2475feb1bf5b5e289fd1a9a158e912dda --- /dev/null +++ b/mlp_out_all/layer_26_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_27_width_16k_l0_big/config.json b/mlp_out_all/layer_27_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..db5b3e0a0b740eb8455c893165def773b3bff172 --- /dev/null +++ b/mlp_out_all/layer_27_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_27_width_262k_l0_small/config.json b/mlp_out_all/layer_27_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ff1a0e2165defa0c9591c8b1bafddaf59be48b05 --- /dev/null +++ b/mlp_out_all/layer_27_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.27.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_28_width_262k_l0_big/config.json b/mlp_out_all/layer_28_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f61a65f7fd2437a94dfcdabf8e87b94171af56c0 --- /dev/null +++ b/mlp_out_all/layer_28_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_29_width_16k_l0_big/config.json b/mlp_out_all/layer_29_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9c864e7bb9f39df94015f918c62c75c115ae6630 --- /dev/null +++ b/mlp_out_all/layer_29_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_29_width_16k_l0_small/config.json b/mlp_out_all/layer_29_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0e279da6a647aae3d437f9a8f9ef2c940b40093 --- /dev/null +++ b/mlp_out_all/layer_29_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_16k_l0_big/config.json b/mlp_out_all/layer_2_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..59a158e7e224e174b4681b64cd56de0f32d9426f --- /dev/null +++ b/mlp_out_all/layer_2_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 65, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_262k_l0_big/config.json b/mlp_out_all/layer_2_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ee25a6a4adf9dfb47e8a18821d9e14bfab8433e2 --- /dev/null +++ b/mlp_out_all/layer_2_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 65, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_30_width_16k_l0_big/config.json b/mlp_out_all/layer_30_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..afe0677e918737113f44c6fd8e9314fa95514983 --- /dev/null +++ b/mlp_out_all/layer_30_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.30.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_33_width_16k_l0_small/config.json b/mlp_out_all/layer_33_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..72c63e9335353f88eacbbe12db0acce3d2b0d458 --- /dev/null +++ b/mlp_out_all/layer_33_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.33.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_34_width_262k_l0_small/config.json b/mlp_out_all/layer_34_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0ababcba8c772102dd00ef4830122b4c2a2e955 --- /dev/null +++ b/mlp_out_all/layer_34_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.34.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.34.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_35_width_262k_l0_big/config.json b/mlp_out_all/layer_35_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..db0c4de2900e8f1f22fd430843671d3800508245 --- /dev/null +++ b/mlp_out_all/layer_35_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.35.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_35_width_262k_l0_small/config.json b/mlp_out_all/layer_35_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f0ebc627bd226a76df682b28d5d4bcfd95f916d4 --- /dev/null +++ b/mlp_out_all/layer_35_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.35.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_36_width_262k_l0_big/config.json b/mlp_out_all/layer_36_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb7ec2c99c49aa476cd17b611440753558764f42 --- /dev/null +++ b/mlp_out_all/layer_36_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.36.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_37_width_16k_l0_small/config.json b/mlp_out_all/layer_37_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6eac354cc2d444f0541bae118f870003339203ac --- /dev/null +++ b/mlp_out_all/layer_37_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_38_width_16k_l0_small/config.json b/mlp_out_all/layer_38_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5a2c4b92b1496534e360e74b6918311cb6a9779 --- /dev/null +++ b/mlp_out_all/layer_38_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.38.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_38_width_262k_l0_big/config.json b/mlp_out_all/layer_38_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c33db4310f01fcc8acb6c6412a0f609598fe4b3a --- /dev/null +++ b/mlp_out_all/layer_38_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.38.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.38.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_40_width_262k_l0_big/config.json b/mlp_out_all/layer_40_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..361e74823de3dc3cf7df5a79a8166140bc639af5 --- /dev/null +++ b/mlp_out_all/layer_40_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.40.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_41_width_16k_l0_big/config.json b/mlp_out_all/layer_41_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4c9e940c978f632149c6f73f00b016c490d9ad40 --- /dev/null +++ b/mlp_out_all/layer_41_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_41_width_16k_l0_small/config.json b/mlp_out_all/layer_41_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ce59e245d17de9c0e3d75700dadc7e116eae65f --- /dev/null +++ b/mlp_out_all/layer_41_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_41_width_262k_l0_big/config.json b/mlp_out_all/layer_41_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..733a0c25a05f0318087474edf52deffc123ac531 --- /dev/null +++ b/mlp_out_all/layer_41_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_42_width_262k_l0_big/config.json b/mlp_out_all/layer_42_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..661f7187d0596184a34d67e9efe603493bc2dafb --- /dev/null +++ b/mlp_out_all/layer_42_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.42.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_43_width_16k_l0_big/config.json b/mlp_out_all/layer_43_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c242c1e5c1d145b19b837485e17ec676b6a9369f --- /dev/null +++ b/mlp_out_all/layer_43_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_43_width_16k_l0_small/config.json b/mlp_out_all/layer_43_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f8418fb4d94199dc3599c8fd899704a57cf7c089 --- /dev/null +++ b/mlp_out_all/layer_43_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_45_width_16k_l0_big/config.json b/mlp_out_all/layer_45_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..545398a1db0eb1db68365bc84c71a2b27aa17273 --- /dev/null +++ b/mlp_out_all/layer_45_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.45.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_46_width_16k_l0_small/config.json b/mlp_out_all/layer_46_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..618d77d072dda334bfc61e796a8e9dd0c17d8aa9 --- /dev/null +++ b/mlp_out_all/layer_46_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.46.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.46.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_49_width_262k_l0_small/config.json b/mlp_out_all/layer_49_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..019c849caa62da63b903ae66a25bd4bf22e2e823 --- /dev/null +++ b/mlp_out_all/layer_49_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.49.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.49.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_16k_l0_big/config.json b/mlp_out_all/layer_4_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..891521a5619ac8bb64cdcba2fea6f7e1f87e1ff9 --- /dev/null +++ b/mlp_out_all/layer_4_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 71, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_16k_l0_small/config.json b/mlp_out_all/layer_4_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..88b065c091f1aa3b1f31d441b503ae3e2fddc91b --- /dev/null +++ b/mlp_out_all/layer_4_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_4_width_262k_l0_small/config.json b/mlp_out_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..14de844f57170c34e0b1297a619f9fdd130aab71 --- /dev/null +++ b/mlp_out_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.4.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_50_width_16k_l0_small/config.json b/mlp_out_all/layer_50_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..727777396f3aea47a8ce613418c47e95943ed0bb --- /dev/null +++ b/mlp_out_all/layer_50_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.50.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_50_width_262k_l0_small/config.json b/mlp_out_all/layer_50_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..edb251f9120358513371f51bf51ce6bbbdeeabff --- /dev/null +++ b/mlp_out_all/layer_50_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.50.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.50.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_51_width_16k_l0_big/config.json b/mlp_out_all/layer_51_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d6a4aee42bededefa8e22622f79ab88df28acfb3 --- /dev/null +++ b/mlp_out_all/layer_51_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.51.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.51.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_51_width_262k_l0_big/config.json b/mlp_out_all/layer_51_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f556945af5c2b87e4e8117706af434127c0eb26d --- /dev/null +++ b/mlp_out_all/layer_51_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.51.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.51.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_52_width_262k_l0_big/config.json b/mlp_out_all/layer_52_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9737180a269f68f5edb85125bc0d4460fdcac802 --- /dev/null +++ b/mlp_out_all/layer_52_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.52.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.52.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_54_width_262k_l0_big/config.json b/mlp_out_all/layer_54_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f2fa5afb1786544bcf435e4bfe52d2f8c3199686 --- /dev/null +++ b/mlp_out_all/layer_54_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.54.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.54.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_55_width_16k_l0_small/config.json b/mlp_out_all/layer_55_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..69759c1c2425019948eeb0a644126fcabc110307 --- /dev/null +++ b/mlp_out_all/layer_55_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.55.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_55_width_262k_l0_big/config.json b/mlp_out_all/layer_55_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7d67d015c97aaca743704d76056c69e7bfc6c968 --- /dev/null +++ b/mlp_out_all/layer_55_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.55.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.55.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_57_width_16k_l0_small/config.json b/mlp_out_all/layer_57_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e6eecb570ed01d9d99ec641442e8d3ad55399b91 --- /dev/null +++ b/mlp_out_all/layer_57_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.57.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.57.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_58_width_16k_l0_big/config.json b/mlp_out_all/layer_58_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..05aa64815918cfcf3f8d01e4afa9e73c726b6cfe --- /dev/null +++ b/mlp_out_all/layer_58_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.58.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_58_width_16k_l0_small/config.json b/mlp_out_all/layer_58_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7e492f3a4d15242088cab0ed402d23ddd7456d90 --- /dev/null +++ b/mlp_out_all/layer_58_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.58.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.58.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_59_width_16k_l0_small/config.json b/mlp_out_all/layer_59_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f27927f3cbd6516234bb73dc1b0033fa386cc74e --- /dev/null +++ b/mlp_out_all/layer_59_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.59.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.59.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_262k_l0_small/config.json b/mlp_out_all/layer_5_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b50b9d51fff89ede039095fc962c657e5742f341 --- /dev/null +++ b/mlp_out_all/layer_5_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_60_width_262k_l0_big/config.json b/mlp_out_all/layer_60_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cf67683834c9e20e2b98ad4159ff5e7cdc91964f --- /dev/null +++ b/mlp_out_all/layer_60_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.60.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.60.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_61_width_262k_l0_big/config.json b/mlp_out_all/layer_61_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3dea7a87a35ece7638c6b0a7a9b712dc23ff61d0 --- /dev/null +++ b/mlp_out_all/layer_61_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.61.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.61.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_big/config.json b/mlp_out_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f106d24b2377013d8c8d02de32190224bf1a1a1c --- /dev/null +++ b/mlp_out_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 80, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_16k_l0_small/config.json b/mlp_out_all/layer_8_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..97bf27b92e2e4a8d75a51a6ef0a30e90ef0b6327 --- /dev/null +++ b/mlp_out_all/layer_8_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-27b-it", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file