diff --git a/attn_out_all/layer_10_width_16k_l0_small/config.json b/attn_out_all/layer_10_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..43b8225c3c6495fa2a1bf187ac586da2f331d406 --- /dev/null +++ b/attn_out_all/layer_10_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.10.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_11_width_262k_l0_small/config.json b/attn_out_all/layer_11_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2117ff26951fcec207848b3ba738839a7b1129d4 --- /dev/null +++ b/attn_out_all/layer_11_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.11.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.11.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 19, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_12_width_262k_l0_big/config.json b/attn_out_all/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..369b13ee9849c546dc3efd17ca28925966b51f47 --- /dev/null +++ b/attn_out_all/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.12.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_13_width_16k_l0_small/config.json b/attn_out_all/layer_13_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d72e3a911e25f139b8e3978b35f9af8df90f09e5 --- /dev/null +++ b/attn_out_all/layer_13_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_13_width_262k_l0_big/config.json b/attn_out_all/layer_13_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c4184803670681eefab43ab5cf5287c374269def --- /dev/null +++ b/attn_out_all/layer_13_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.13.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_17_width_16k_l0_small/config.json b/attn_out_all/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0ecf9b06503dc8a6570e728cc56949643826fd7 --- /dev/null +++ b/attn_out_all/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.17.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_18_width_262k_l0_big/config.json b/attn_out_all/layer_18_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7715c235016fc26e98ca263c853befd545775af7 --- /dev/null +++ b/attn_out_all/layer_18_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.18.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.18.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_19_width_16k_l0_big/config.json b/attn_out_all/layer_19_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..90176af8eb6ae086ecff3e421fabeb8aaff483a9 --- /dev/null +++ b/attn_out_all/layer_19_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.19.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_19_width_16k_l0_small/config.json b/attn_out_all/layer_19_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b90bb13258997137dce9086343118f10d92e0d37 --- /dev/null +++ b/attn_out_all/layer_19_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.19.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_19_width_262k_l0_small/config.json b/attn_out_all/layer_19_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..542b25af64b821123760a49f56b6ba1a82da2535 --- /dev/null +++ b/attn_out_all/layer_19_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.19.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.19.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_1_width_16k_l0_big/config.json b/attn_out_all/layer_1_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15b395b9f779b5e3f31df6988fa559234eb2c42 --- /dev/null +++ b/attn_out_all/layer_1_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.1.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.1.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 65, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_20_width_16k_l0_big/config.json b/attn_out_all/layer_20_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1b78fada17399de52f22f4c9802d736fab0c43c0 --- /dev/null +++ b/attn_out_all/layer_20_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.20.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.20.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_21_width_16k_l0_big/config.json b/attn_out_all/layer_21_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f72720551d20b72f257f781c6fa1fbfedd6063fa --- /dev/null +++ b/attn_out_all/layer_21_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.21.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_21_width_16k_l0_small/config.json b/attn_out_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..22bbb42c19551b3a971f7a00e64c2f3c7dd567ab --- /dev/null +++ b/attn_out_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.21.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_22_width_262k_l0_small/config.json b/attn_out_all/layer_22_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7543bad9df61d39c9622cb38151c24c1563c2173 --- /dev/null +++ b/attn_out_all/layer_22_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.22.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_23_width_16k_l0_small/config.json b/attn_out_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32b3014ae354d04915c93f2196981587f764ca1e --- /dev/null +++ b/attn_out_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.23.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_24_width_16k_l0_big/config.json b/attn_out_all/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5c9615daeb90b922250a9c7d8c501ed1e2ff7b4 --- /dev/null +++ b/attn_out_all/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_24_width_262k_l0_big/config.json b/attn_out_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5853ad75c22646c42bb58d344171091c339c2645 --- /dev/null +++ b/attn_out_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_24_width_262k_l0_small/config.json b/attn_out_all/layer_24_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..96046ccd33d7c3bb9353b56ef75c4852eddffc85 --- /dev/null +++ b/attn_out_all/layer_24_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.24.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_25_width_16k_l0_big/config.json b/attn_out_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d6537557ba135e3bc5917e7508ec7d52521da5a0 --- /dev/null +++ b/attn_out_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.25.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_25_width_262k_l0_small/config.json b/attn_out_all/layer_25_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f53cec14ed0a92f3745c0192a7f07bd2b48ee241 --- /dev/null +++ b/attn_out_all/layer_25_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.25.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_26_width_16k_l0_big/config.json b/attn_out_all/layer_26_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..238c4d23d0852814dd8e4915e7f9ed44da4e834e --- /dev/null +++ b/attn_out_all/layer_26_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.26.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_26_width_262k_l0_big/config.json b/attn_out_all/layer_26_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d2545f7f11ba0ed9e0130d5d04aae49867b9ce43 --- /dev/null +++ b/attn_out_all/layer_26_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.26.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_27_width_262k_l0_small/config.json b/attn_out_all/layer_27_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b0b6708a9c4d3f38bd18363db9a66a0689c91add --- /dev/null +++ b/attn_out_all/layer_27_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.27.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_28_width_16k_l0_big/config.json b/attn_out_all/layer_28_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7534b9305f08a2e4850193d0baed6c82ced696c6 --- /dev/null +++ b/attn_out_all/layer_28_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.28.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_29_width_16k_l0_big/config.json b/attn_out_all/layer_29_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2e136646463675b103b5c7a2db0219aa227b89b9 --- /dev/null +++ b/attn_out_all/layer_29_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.29.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_29_width_16k_l0_small/config.json b/attn_out_all/layer_29_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..56512f791eb0a44a0ea54834a2356335f43135d9 --- /dev/null +++ b/attn_out_all/layer_29_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.29.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_2_width_262k_l0_small/config.json b/attn_out_all/layer_2_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..17397babbf2f54626c056b800bd37a38bd01d434 --- /dev/null +++ b/attn_out_all/layer_2_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.2.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.2.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_30_width_16k_l0_small/config.json b/attn_out_all/layer_30_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..237e9a93b3a9c22bd317f8597481acb91ac55086 --- /dev/null +++ b/attn_out_all/layer_30_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.30.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.30.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_30_width_262k_l0_small/config.json b/attn_out_all/layer_30_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..002fd0b7eea6de8ff93c0be6630666bde074135b --- /dev/null +++ b/attn_out_all/layer_30_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.30.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.30.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_32_width_16k_l0_big/config.json b/attn_out_all/layer_32_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9818aa5fab7b4b3f99276d0744c7755bec854b57 --- /dev/null +++ b/attn_out_all/layer_32_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.32.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.32.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_32_width_16k_l0_small/config.json b/attn_out_all/layer_32_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aef809dcdb6391a4a4af74c3426a7dc9238f9da2 --- /dev/null +++ b/attn_out_all/layer_32_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.32.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.32.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_33_width_262k_l0_small/config.json b/attn_out_all/layer_33_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df7a7940c09de3438dd6caeab2fb9a6036bf7506 --- /dev/null +++ b/attn_out_all/layer_33_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.33.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_3_width_262k_l0_small/config.json b/attn_out_all/layer_3_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cba8f1430ce1987d64279b359bf3a9e2ea96d6fc --- /dev/null +++ b/attn_out_all/layer_3_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.3.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_5_width_262k_l0_big/config.json b/attn_out_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1c8ed2495e2662dccde810123dc654252bd29d23 --- /dev/null +++ b/attn_out_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.5.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 86, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_6_width_16k_l0_big/config.json b/attn_out_all/layer_6_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cc39ff295ef2443a6032e36da62ffc93d89071f7 --- /dev/null +++ b/attn_out_all/layer_6_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.6.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 91, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_7_width_16k_l0_big/config.json b/attn_out_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d1a2631c41c372b6b445fe489adbe319630f5e80 --- /dev/null +++ b/attn_out_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 97, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_7_width_16k_l0_small/config.json b/attn_out_all/layer_7_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2c20d6239128be925a4e1af6fcf080416247a109 --- /dev/null +++ b/attn_out_all/layer_7_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.7.self_attn.o_proj.input", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_9_width_262k_l0_big/config.json b/attn_out_all/layer_9_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2430aa5334db765948ee59fadfa92ea24a5c0d7e --- /dev/null +++ b/attn_out_all/layer_9_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 107, + "affine_connection": false +} \ No newline at end of file diff --git a/attn_out_all/layer_9_width_262k_l0_small/config.json b/attn_out_all/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bdb2781cb7efeb52a2ce915fddf279a0b90a8be7 --- /dev/null +++ b/attn_out_all/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.self_attn.o_proj.input", + "hf_hook_point_out": "model.layers.9.self_attn.o_proj.input", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_17_width_65k_l0_small/config.json b/resid_post/layer_17_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..cd1b3d09aaac477447472b93bc6ea6cc16a2f77d --- /dev/null +++ b/resid_post/layer_17_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_29_width_262k_l0_small/config.json b/resid_post/layer_29_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..73b6ec4a738606a5579aefd5de463d09a71da3bc --- /dev/null +++ b/resid_post/layer_29_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_16k_l0_small/config.json b/resid_post/layer_9_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bdc5309a9c7de8a5b4726cd55a94236ab00aa1c8 --- /dev/null +++ b/resid_post/layer_9_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post/layer_9_width_65k_l0_small/config.json b/resid_post/layer_9_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9044e3d51188e6072e17716271e1ac692f1685af --- /dev/null +++ b/resid_post/layer_9_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.output", + "hf_hook_point_out": "model.layers.9.output", + "width": 65536, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_16k_l0_big/config.json b/resid_post_all/layer_0_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e8a8e56ea43fe66f1208f9cc226b12b6b07fe9de --- /dev/null +++ b/resid_post_all/layer_0_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_0_width_262k_l0_big/config.json b/resid_post_all/layer_0_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bf090de0aed43e2fa01a104730416ce7e0f435f8 --- /dev/null +++ b/resid_post_all/layer_0_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.output", + "hf_hook_point_out": "model.layers.0.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_16k_l0_big/config.json b/resid_post_all/layer_10_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..9086605d13b44efdc71902f4c12c6248c56ee970 --- /dev/null +++ b/resid_post_all/layer_10_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 112, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_10_width_262k_l0_big/config.json b/resid_post_all/layer_10_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..06cfa322395cddc6d5fb875368f06daf27824821 --- /dev/null +++ b/resid_post_all/layer_10_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.output", + "hf_hook_point_out": "model.layers.10.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 112, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_16k_l0_big/config.json b/resid_post_all/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7c8d1726d1e8491acce8c98158e20d2b655d2c04 --- /dev/null +++ b/resid_post_all/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_16k_l0_small/config.json b/resid_post_all/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a3b0a2853561ae033a22b5102dc695ad141f1fec --- /dev/null +++ b/resid_post_all/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_12_width_262k_l0_small/config.json b/resid_post_all/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..70fbcb91dff3201232f2dc8b6a72e6941fe0a680 --- /dev/null +++ b/resid_post_all/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.output", + "hf_hook_point_out": "model.layers.12.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_13_width_16k_l0_big/config.json b/resid_post_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f6311d150e9703f020f0a6a5cf3422bb1086c0ae --- /dev/null +++ b/resid_post_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.output", + "hf_hook_point_out": "model.layers.13.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_14_width_262k_l0_small/config.json b/resid_post_all/layer_14_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..83ac280d09175b6b688317e1fe5e4241ff2d2973 --- /dev/null +++ b/resid_post_all/layer_14_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.14.output", + "hf_hook_point_out": "model.layers.14.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_16k_l0_small/config.json b/resid_post_all/layer_15_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..650a9de1e570315e18272d0610667b15fc9c5830 --- /dev/null +++ b/resid_post_all/layer_15_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_262k_l0_big/config.json b/resid_post_all/layer_15_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f897119ad4c0edb1a57eda438abcbc6d6077fa9 --- /dev/null +++ b/resid_post_all/layer_15_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_15_width_262k_l0_small/config.json b/resid_post_all/layer_15_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f3a99f74f2bce4115333198443b401636275119d --- /dev/null +++ b/resid_post_all/layer_15_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.15.output", + "hf_hook_point_out": "model.layers.15.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_16k_l0_small/config.json b/resid_post_all/layer_16_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2044d61b317b29293c4f0df5912249a4bb8e355c --- /dev/null +++ b/resid_post_all/layer_16_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_16_width_262k_l0_small/config.json b/resid_post_all/layer_16_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183be0a24c93e2c1f5ddd6569c7080c05258327f --- /dev/null +++ b/resid_post_all/layer_16_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.output", + "hf_hook_point_out": "model.layers.16.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_16k_l0_big/config.json b/resid_post_all/layer_17_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f13df5647006ddc361356a1b1052a45ffa9ac0e8 --- /dev/null +++ b/resid_post_all/layer_17_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_16k_l0_small/config.json b/resid_post_all/layer_17_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..27cb1162cdc08d23f603748a40fd671fdb7d245a --- /dev/null +++ b/resid_post_all/layer_17_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_17_width_262k_l0_big/config.json b/resid_post_all/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ab1c787b0d316aa17fb089218b7cc916a0fc6cef --- /dev/null +++ b/resid_post_all/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.output", + "hf_hook_point_out": "model.layers.17.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_16k_l0_small/config.json b/resid_post_all/layer_18_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0167029c88277718844c67bc53386805f1dade7a --- /dev/null +++ b/resid_post_all/layer_18_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_18_width_262k_l0_small/config.json b/resid_post_all/layer_18_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ca27dfa2a760f40641f8a6cce27e08410392061 --- /dev/null +++ b/resid_post_all/layer_18_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.18.output", + "hf_hook_point_out": "model.layers.18.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_16k_l0_small/config.json b/resid_post_all/layer_1_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..933fe703ba20dedd8a0bf3052c701d9eb2e31332 --- /dev/null +++ b/resid_post_all/layer_1_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_1_width_262k_l0_big/config.json b/resid_post_all/layer_1_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..659161572f8205b669bb181461415f8299154c1a --- /dev/null +++ b/resid_post_all/layer_1_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.1.output", + "hf_hook_point_out": "model.layers.1.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 65, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_16k_l0_small/config.json b/resid_post_all/layer_20_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ba7a1dcc770b2036c6cf60b016bad5d28314b4a8 --- /dev/null +++ b/resid_post_all/layer_20_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_20_width_262k_l0_small/config.json b/resid_post_all/layer_20_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6814cf6bebc746dac9eab9fd1cb128d1cb9483d --- /dev/null +++ b/resid_post_all/layer_20_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.20.output", + "hf_hook_point_out": "model.layers.20.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_262k_l0_big/config.json b/resid_post_all/layer_21_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..28e95edce9bf3f27bb0c6c13e1b2ea0ab9fa82db --- /dev/null +++ b/resid_post_all/layer_21_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_21_width_262k_l0_small/config.json b/resid_post_all/layer_21_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8cf1593c3d63b5d7f830a34aa0aeae079a2877ac --- /dev/null +++ b/resid_post_all/layer_21_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.output", + "hf_hook_point_out": "model.layers.21.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_16k_l0_small/config.json b/resid_post_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..98d279f9aeef4dad20078a389231846641b77bbb --- /dev/null +++ b/resid_post_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_22_width_262k_l0_big/config.json b/resid_post_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5e26ef5f7af843e617ee06179874598c26731150 --- /dev/null +++ b/resid_post_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.output", + "hf_hook_point_out": "model.layers.22.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_262k_l0_big/config.json b/resid_post_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e6fe8ad1e757b337ccb0f5df006d44702e00093c --- /dev/null +++ b/resid_post_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_23_width_262k_l0_small/config.json b/resid_post_all/layer_23_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..78495d686ffb899bf8ff68303aed63804335472f --- /dev/null +++ b/resid_post_all/layer_23_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.output", + "hf_hook_point_out": "model.layers.23.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_25_width_262k_l0_big/config.json b/resid_post_all/layer_25_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..63a715216ee7cfa3ee3f4559c180ffc99fd081ba --- /dev/null +++ b/resid_post_all/layer_25_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.output", + "hf_hook_point_out": "model.layers.25.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_26_width_262k_l0_small/config.json b/resid_post_all/layer_26_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..784d635a256d9fa0f621645c7e8fe118e728d2d0 --- /dev/null +++ b/resid_post_all/layer_26_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.output", + "hf_hook_point_out": "model.layers.26.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_27_width_16k_l0_big/config.json b/resid_post_all/layer_27_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2b92271f6a7b2a671fa6c47f0747e98907624e51 --- /dev/null +++ b/resid_post_all/layer_27_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.output", + "hf_hook_point_out": "model.layers.27.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_27_width_16k_l0_small/config.json b/resid_post_all/layer_27_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a11755ecc36c4f9cf9b7bf5e6f738f9c269b1942 --- /dev/null +++ b/resid_post_all/layer_27_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.27.output", + "hf_hook_point_out": "model.layers.27.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_28_width_16k_l0_big/config.json b/resid_post_all/layer_28_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..75b8d74cbb530f79e983c0ba7b9c320b2a069245 --- /dev/null +++ b/resid_post_all/layer_28_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.output", + "hf_hook_point_out": "model.layers.28.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_28_width_262k_l0_big/config.json b/resid_post_all/layer_28_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fdb731a362a126fa382fcaba3f5d2843b42e39b9 --- /dev/null +++ b/resid_post_all/layer_28_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.output", + "hf_hook_point_out": "model.layers.28.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_28_width_262k_l0_small/config.json b/resid_post_all/layer_28_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1321168f9fe4641fdfbc29c7c8c6c135fb69f5b1 --- /dev/null +++ b/resid_post_all/layer_28_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.output", + "hf_hook_point_out": "model.layers.28.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_29_width_16k_l0_small/config.json b/resid_post_all/layer_29_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e77c58a885087f4b5a5c0c31cfc1e027b38d2375 --- /dev/null +++ b/resid_post_all/layer_29_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_29_width_262k_l0_big/config.json b/resid_post_all/layer_29_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8b958e3cdac22d6eb8128b65ff3fb290ae669c03 --- /dev/null +++ b/resid_post_all/layer_29_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.output", + "hf_hook_point_out": "model.layers.29.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_16k_l0_big/config.json b/resid_post_all/layer_2_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d0a0dce7bb15b4ee11c7ef085601dc9fc3692f5 --- /dev/null +++ b/resid_post_all/layer_2_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 70, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_16k_l0_small/config.json b/resid_post_all/layer_2_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..32988c5b9abea42396f49dd22f4b787cab0745bf --- /dev/null +++ b/resid_post_all/layer_2_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_2_width_262k_l0_big/config.json b/resid_post_all/layer_2_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..844169ddaf82afb604e0a12624bfa91fd12faa97 --- /dev/null +++ b/resid_post_all/layer_2_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.2.output", + "hf_hook_point_out": "model.layers.2.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 70, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_30_width_16k_l0_small/config.json b/resid_post_all/layer_30_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..95ddbc4f7cae4acd3eed239951dcd83aa00c1d2a --- /dev/null +++ b/resid_post_all/layer_30_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.30.output", + "hf_hook_point_out": "model.layers.30.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_31_width_16k_l0_small/config.json b/resid_post_all/layer_31_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6bf37ae69b0a2c35c304ea95c7985810c8dc8ad7 --- /dev/null +++ b/resid_post_all/layer_31_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.output", + "hf_hook_point_out": "model.layers.31.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_33_width_16k_l0_big/config.json b/resid_post_all/layer_33_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..855d46933856d13c87a234cbee8258382bfd8c91 --- /dev/null +++ b/resid_post_all/layer_33_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.output", + "hf_hook_point_out": "model.layers.33.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_33_width_16k_l0_small/config.json b/resid_post_all/layer_33_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1cbcf69292cf6b6c65b80b2e84e87b897b4283cb --- /dev/null +++ b/resid_post_all/layer_33_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.33.output", + "hf_hook_point_out": "model.layers.33.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_3_width_16k_l0_small/config.json b/resid_post_all/layer_3_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2b915f2b2b2f1bd3cd548fdf7fab4e8c18ef4fa4 --- /dev/null +++ b/resid_post_all/layer_3_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.output", + "hf_hook_point_out": "model.layers.3.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 12, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_16k_l0_small/config.json b/resid_post_all/layer_4_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a05caa1d162968ffaff87cce7f0c176dea30f130 --- /dev/null +++ b/resid_post_all/layer_4_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_4_width_262k_l0_small/config.json b/resid_post_all/layer_4_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..daa8c9f4dd809e5a9147ca4c43cba0e7614dca28 --- /dev/null +++ b/resid_post_all/layer_4_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.4.output", + "hf_hook_point_out": "model.layers.4.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_16k_l0_small/config.json b/resid_post_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7d417cdc676ebc103b22d30192980eba20e3dcb8 --- /dev/null +++ b/resid_post_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_5_width_262k_l0_small/config.json b/resid_post_all/layer_5_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..166b1f0bbddce61e2754c9e16f1b11cdc23e2f31 --- /dev/null +++ b/resid_post_all/layer_5_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.output", + "hf_hook_point_out": "model.layers.5.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 14, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_16k_l0_big/config.json b/resid_post_all/layer_6_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..24e50e46d86551e820278ed11e0cf79e52bcc3e0 --- /dev/null +++ b/resid_post_all/layer_6_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 91, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_16k_l0_small/config.json b/resid_post_all/layer_6_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..69a2570664e5699ace6626346b4caf5e0ac98d47 --- /dev/null +++ b/resid_post_all/layer_6_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 16384, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_262k_l0_big/config.json b/resid_post_all/layer_6_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d4f1120aecb9f723324dd98d16a11cecff2ef1ea --- /dev/null +++ b/resid_post_all/layer_6_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 91, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_6_width_262k_l0_small/config.json b/resid_post_all/layer_6_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a5482ee1f06e0a2a5ffdfc85a8b64764b6741d41 --- /dev/null +++ b/resid_post_all/layer_6_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.output", + "hf_hook_point_out": "model.layers.6.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_262k_l0_big/config.json b/resid_post_all/layer_7_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ec3dfa3ab8ec822f0d52ca7ba9340f901d6a5e63 --- /dev/null +++ b/resid_post_all/layer_7_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 97, + "affine_connection": false +} \ No newline at end of file diff --git a/resid_post_all/layer_7_width_262k_l0_small/config.json b/resid_post_all/layer_7_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aa7c7c241775c4a425b611719a4c7fd8e52a72ac --- /dev/null +++ b/resid_post_all/layer_7_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.output", + "hf_hook_point_out": "model.layers.7.output", + "width": 262144, + "model_name": "gemma-v3-4b-it", + "architecture": "jump_relu", + "l0": 16, + "affine_connection": false +} \ No newline at end of file