diff --git a/mlp_out/layer_12_width_16k_l0_big/config.json b/mlp_out/layer_12_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3f41ba97f1efce306c5852d7c2f1e5bda3d1d152 --- /dev/null +++ b/mlp_out/layer_12_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_12_width_16k_l0_medium/config.json b/mlp_out/layer_12_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..994e3137a251664d5fcd5f6f2349021a20b8bb45 --- /dev/null +++ b/mlp_out/layer_12_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_12_width_16k_l0_small/config.json b/mlp_out/layer_12_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d9435a3de4c347d3ee1c3a9cee56524c401e28bc --- /dev/null +++ b/mlp_out/layer_12_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_12_width_262k_l0_big/config.json b/mlp_out/layer_12_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..465c30e5ac459cc7d60ef4912d98c099929df742 --- /dev/null +++ b/mlp_out/layer_12_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_12_width_262k_l0_medium/config.json b/mlp_out/layer_12_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..95f7174e8c6899777545527faea75c40201c5f91 --- /dev/null +++ b/mlp_out/layer_12_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_12_width_262k_l0_small/config.json b/mlp_out/layer_12_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3ab1dfd4459edc2dbfc764c841dd908387b2caf6 --- /dev/null +++ b/mlp_out/layer_12_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_12_width_65k_l0_big/config.json b/mlp_out/layer_12_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a403dec5cc1fe2c8cb28c88675dfc14515cb5291 --- /dev/null +++ b/mlp_out/layer_12_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 127, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_12_width_65k_l0_medium/config.json b/mlp_out/layer_12_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..02aebc5ce6a0cdf169dc23c4b8e0682bba63ab4a --- /dev/null +++ b/mlp_out/layer_12_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 52, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_12_width_65k_l0_small/config.json b/mlp_out/layer_12_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..932187514eaa1e5378e087bbef543fee0952fc18 --- /dev/null +++ b/mlp_out/layer_12_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.12.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.12.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 17, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_24_width_16k_l0_big/config.json b/mlp_out/layer_24_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..853f61ead47a0bc708a9310186f98e9a2cf9d79e --- /dev/null +++ b/mlp_out/layer_24_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_24_width_16k_l0_small/config.json b/mlp_out/layer_24_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..151e81812876048056cac351640c4c143980bbec --- /dev/null +++ b/mlp_out/layer_24_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_24_width_65k_l0_small/config.json b/mlp_out/layer_24_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d7fa39117b7832319213dbb014491f019df301cf --- /dev/null +++ b/mlp_out/layer_24_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_31_width_262k_l0_big/config.json b/mlp_out/layer_31_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..25e344d0e6452522b35fe936f4f31196f102d02d --- /dev/null +++ b/mlp_out/layer_31_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_31_width_262k_l0_medium/config.json b/mlp_out/layer_31_width_262k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..35817e2e4436f71ecb4967275f7d81c80f1ff118 --- /dev/null +++ b/mlp_out/layer_31_width_262k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_31_width_65k_l0_big/config.json b/mlp_out/layer_31_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..11746dcc33fe4e95a478e2ab9005cb27140a0729 --- /dev/null +++ b/mlp_out/layer_31_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_31_width_65k_l0_medium/config.json b/mlp_out/layer_31_width_65k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4a0e86634e2c65b7dba2c43fb32edb48d7301a7c --- /dev/null +++ b/mlp_out/layer_31_width_65k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_31_width_65k_l0_small/config.json b/mlp_out/layer_31_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..47083e4dfbfedfe78ac8e2e8624d942603976481 --- /dev/null +++ b/mlp_out/layer_31_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_41_width_16k_l0_medium/config.json b/mlp_out/layer_41_width_16k_l0_medium/config.json new file mode 100644 index 0000000000000000000000000000000000000000..144b4a011a8d952f994235796a1dfa3ffdbb65be --- /dev/null +++ b/mlp_out/layer_41_width_16k_l0_medium/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_41_width_16k_l0_small/config.json b/mlp_out/layer_41_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..180f4cc4bb73fd5e1e9464a5b82d9847625123c2 --- /dev/null +++ b/mlp_out/layer_41_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_41_width_262k_l0_big/config.json b/mlp_out/layer_41_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..82d047e064cd7ae6f485ccc9be460f2416809295 --- /dev/null +++ b/mlp_out/layer_41_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_41_width_262k_l0_small/config.json b/mlp_out/layer_41_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b30a7eaa176b88c5ee866303f9ac53142c1cbb41 --- /dev/null +++ b/mlp_out/layer_41_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_41_width_65k_l0_big/config.json b/mlp_out/layer_41_width_65k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1dbf3e845231a9d9778bd968f02dceb0213bb975 --- /dev/null +++ b/mlp_out/layer_41_width_65k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 150, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out/layer_41_width_65k_l0_small/config.json b/mlp_out/layer_41_width_65k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c48111952ae3e7144e87900d9e141ebabb70393b --- /dev/null +++ b/mlp_out/layer_41_width_65k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 65536, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_16k_l0_big/config.json b/mlp_out_all/layer_0_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..26523bcfd49fec0483f67df7c2463a33a7801f91 --- /dev/null +++ b/mlp_out_all/layer_0_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 60, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_0_width_262k_l0_small/config.json b/mlp_out_all/layer_0_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fecc1424138deac2b6af5d2ab471b6e9353a6a28 --- /dev/null +++ b/mlp_out_all/layer_0_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.0.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.0.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 10, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_10_width_262k_l0_big/config.json b/mlp_out_all/layer_10_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0357c1c361f4a3aab63de9bf13425a213837cfb7 --- /dev/null +++ b/mlp_out_all/layer_10_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.10.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.10.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 97, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_16k_l0_big/config.json b/mlp_out_all/layer_13_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8484b6427a1a2d47e7fcc9b8d5a73e83e7315afc --- /dev/null +++ b/mlp_out_all/layer_13_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 108, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_13_width_262k_l0_small/config.json b/mlp_out_all/layer_13_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..024a0b2632fecd7718b4e177c809b674e5932b7b --- /dev/null +++ b/mlp_out_all/layer_13_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.13.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.13.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 18, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_14_width_16k_l0_big/config.json b/mlp_out_all/layer_14_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..988cae5a3c9f2f737e18db0a9176c5726fc1d91b --- /dev/null +++ b/mlp_out_all/layer_14_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.14.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.14.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 112, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_15_width_262k_l0_big/config.json b/mlp_out_all/layer_15_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..413fd8af9c449f1e33429104d892e3cf1e1de6df --- /dev/null +++ b/mlp_out_all/layer_15_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.15.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.15.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 116, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_16k_l0_big/config.json b/mlp_out_all/layer_16_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fde6f48de8d6f1253c5a1a89e2f1d96db68bd912 --- /dev/null +++ b/mlp_out_all/layer_16_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_16_width_262k_l0_big/config.json b/mlp_out_all/layer_16_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..47b83a348a363d54b5d18b0f746d92ae72ac11ea --- /dev/null +++ b/mlp_out_all/layer_16_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.16.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.16.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_17_width_262k_l0_big/config.json b/mlp_out_all/layer_17_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b8a4835313ed11a96bf716262491409fc5efc40a --- /dev/null +++ b/mlp_out_all/layer_17_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.17.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.17.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_18_width_16k_l0_small/config.json b/mlp_out_all/layer_18_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a88f02ec5db0d4d5d01881133df019a34b6702ce --- /dev/null +++ b/mlp_out_all/layer_18_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.18.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_18_width_262k_l0_big/config.json b/mlp_out_all/layer_18_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b0eeb8c64d47b36b51f26cca700c04c68f5ba5cb --- /dev/null +++ b/mlp_out_all/layer_18_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.18.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.18.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_21_width_16k_l0_small/config.json b/mlp_out_all/layer_21_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..22e8101650a730d9e5a535b90a1b950b82ac35fe --- /dev/null +++ b/mlp_out_all/layer_21_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.21.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.21.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_16k_l0_small/config.json b/mlp_out_all/layer_22_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..598ad527f68abde790ce270f043dc0a1cb571b66 --- /dev/null +++ b/mlp_out_all/layer_22_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_22_width_262k_l0_big/config.json b/mlp_out_all/layer_22_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d2a138af789f75d61349549b3794fbb64c28d769 --- /dev/null +++ b/mlp_out_all/layer_22_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.22.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.22.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_16k_l0_small/config.json b/mlp_out_all/layer_23_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6a55a06580e14fdd9f8c9f28ddfa9dbeba796609 --- /dev/null +++ b/mlp_out_all/layer_23_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_23_width_262k_l0_big/config.json b/mlp_out_all/layer_23_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d31d390eb9e3523a5fc7c1db6ee19b0eae8a61c1 --- /dev/null +++ b/mlp_out_all/layer_23_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.23.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.23.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_24_width_262k_l0_big/config.json b/mlp_out_all/layer_24_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a167011e7bfea360250990a8b77cf77ad5ff4f54 --- /dev/null +++ b/mlp_out_all/layer_24_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_24_width_262k_l0_small/config.json b/mlp_out_all/layer_24_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef39b7d49bbc80811a558aaa8e20c9b822083810 --- /dev/null +++ b/mlp_out_all/layer_24_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.24.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.24.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_25_width_16k_l0_big/config.json b/mlp_out_all/layer_25_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..8a69f90f8217c64b53472d5aab8ef36d52d1e377 --- /dev/null +++ b/mlp_out_all/layer_25_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.25.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.25.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_26_width_16k_l0_small/config.json b/mlp_out_all/layer_26_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3bd7e083117e85d969e62069c3045e001f2fd0fb --- /dev/null +++ b/mlp_out_all/layer_26_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_26_width_262k_l0_small/config.json b/mlp_out_all/layer_26_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b64f8e8ed58d6c2fdcb1a682740ff9a07c00ac79 --- /dev/null +++ b/mlp_out_all/layer_26_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.26.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.26.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_28_width_262k_l0_small/config.json b/mlp_out_all/layer_28_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0ec7640b2d8a20e7e3ba99b32479bfe2c6f1d5b3 --- /dev/null +++ b/mlp_out_all/layer_28_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.28.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.28.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_29_width_262k_l0_big/config.json b/mlp_out_all/layer_29_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b0179c741fbbd15bdf960000c699a4fcb42828f7 --- /dev/null +++ b/mlp_out_all/layer_29_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_29_width_262k_l0_small/config.json b/mlp_out_all/layer_29_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c5263a10d539e654017ea76329648afeab2ea956 --- /dev/null +++ b/mlp_out_all/layer_29_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.29.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.29.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_2_width_16k_l0_small/config.json b/mlp_out_all/layer_2_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..53ed7f51b9d3a89eb2c2c936250989119db12520 --- /dev/null +++ b/mlp_out_all/layer_2_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.2.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.2.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 11, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_30_width_16k_l0_small/config.json b/mlp_out_all/layer_30_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef43511a860e8fc77ddde633846a67069f19e4e0 --- /dev/null +++ b/mlp_out_all/layer_30_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.30.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.30.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_31_width_16k_l0_big/config.json b/mlp_out_all/layer_31_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..316813eb46bdf661095f413e6efd789096f0498c --- /dev/null +++ b/mlp_out_all/layer_31_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_31_width_16k_l0_small/config.json b/mlp_out_all/layer_31_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..6d9872ffefaae6ecceb2052381e622d6c6ff6667 --- /dev/null +++ b/mlp_out_all/layer_31_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_31_width_262k_l0_small/config.json b/mlp_out_all/layer_31_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..45b75ee40db68e94224343d1906899e1da206e9e --- /dev/null +++ b/mlp_out_all/layer_31_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.31.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.31.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_35_width_262k_l0_big/config.json b/mlp_out_all/layer_35_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a4272b9d7473cd19c2a471b8145ecc87ad67ee32 --- /dev/null +++ b/mlp_out_all/layer_35_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.35.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.35.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_36_width_262k_l0_small/config.json b/mlp_out_all/layer_36_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..45570e315fb09ca739df1a796423c46b5e326c5f --- /dev/null +++ b/mlp_out_all/layer_36_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.36.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.36.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_37_width_16k_l0_big/config.json b/mlp_out_all/layer_37_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..35eb8ea9d2df1a461687179a77f89b48b819b888 --- /dev/null +++ b/mlp_out_all/layer_37_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_37_width_16k_l0_small/config.json b/mlp_out_all/layer_37_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5eb492703279e50f083505123ad0c58ff335d042 --- /dev/null +++ b/mlp_out_all/layer_37_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_37_width_262k_l0_big/config.json b/mlp_out_all/layer_37_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3a5d1d55eb931c7d150c9821cca08ff2152cdb40 --- /dev/null +++ b/mlp_out_all/layer_37_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.37.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.37.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_39_width_262k_l0_big/config.json b/mlp_out_all/layer_39_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3e99238bad1073666cc269e6d2f541eff95de06e --- /dev/null +++ b/mlp_out_all/layer_39_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.39.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.39.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_3_width_262k_l0_big/config.json b/mlp_out_all/layer_3_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..433c7c7ba7123453bbec23043eeef26773d557fd --- /dev/null +++ b/mlp_out_all/layer_3_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.3.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.3.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 71, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_40_width_16k_l0_big/config.json b/mlp_out_all/layer_40_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d3392b8eac6673a691198ee7580a27c2d077ca2 --- /dev/null +++ b/mlp_out_all/layer_40_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.40.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_40_width_262k_l0_big/config.json b/mlp_out_all/layer_40_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5b31f6bad017ec6766d4aec233d9d76ba604d8f5 --- /dev/null +++ b/mlp_out_all/layer_40_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.40.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.40.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_41_width_16k_l0_big/config.json b/mlp_out_all/layer_41_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d7056b4dcaa36ba8f57c5f74fc6c9c16ac8b6893 --- /dev/null +++ b/mlp_out_all/layer_41_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.41.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.41.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_42_width_262k_l0_big/config.json b/mlp_out_all/layer_42_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b284c592e3faccf0abb15c3cc14a1b584757dc1c --- /dev/null +++ b/mlp_out_all/layer_42_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.42.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_42_width_262k_l0_small/config.json b/mlp_out_all/layer_42_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..fdbed6598102837ce8240ff9d9ca21daec4eabc0 --- /dev/null +++ b/mlp_out_all/layer_42_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.42.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.42.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_43_width_16k_l0_big/config.json b/mlp_out_all/layer_43_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..43e9e548a6285f43e7d312c4ccc3fbcd87b32bc6 --- /dev/null +++ b/mlp_out_all/layer_43_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.43.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.43.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_45_width_262k_l0_big/config.json b/mlp_out_all/layer_45_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a81e168b733d4b7f407a17c6dc2b8165e3285915 --- /dev/null +++ b/mlp_out_all/layer_45_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.45.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.45.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_46_width_16k_l0_small/config.json b/mlp_out_all/layer_46_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..47ed4f3b5a1e57be173a571e570f4dfbb8240e35 --- /dev/null +++ b/mlp_out_all/layer_46_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.46.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.46.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 20, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_47_width_262k_l0_big/config.json b/mlp_out_all/layer_47_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..041c3722f942e31c8cdeeafa05abb43062c95548 --- /dev/null +++ b/mlp_out_all/layer_47_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.47.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.47.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 120, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_16k_l0_small/config.json b/mlp_out_all/layer_5_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c8e821243ae15ff0f7374327aa7f17c5dc9c5d95 --- /dev/null +++ b/mlp_out_all/layer_5_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_5_width_262k_l0_big/config.json b/mlp_out_all/layer_5_width_262k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..ddf455e3b81ae2afc8c804e7357d5df52e646a57 --- /dev/null +++ b/mlp_out_all/layer_5_width_262k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.5.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.5.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 78, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_6_width_16k_l0_small/config.json b/mlp_out_all/layer_6_width_16k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..20e8f199926488c7be55c35067491b003a43fd41 --- /dev/null +++ b/mlp_out_all/layer_6_width_16k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.6.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.6.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 13, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_7_width_16k_l0_big/config.json b/mlp_out_all/layer_7_width_16k_l0_big/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7116b375f1e57b6d7b87f8b2f57f1a0f4a9fa4d7 --- /dev/null +++ b/mlp_out_all/layer_7_width_16k_l0_big/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.7.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.7.post_feedforward_layernorm.output", + "width": 16384, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 86, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_8_width_262k_l0_small/config.json b/mlp_out_all/layer_8_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3b3707c0cf56af9053207ee85c979fa76e85c87f --- /dev/null +++ b/mlp_out_all/layer_8_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.8.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.8.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file diff --git a/mlp_out_all/layer_9_width_262k_l0_small/config.json b/mlp_out_all/layer_9_width_262k_l0_small/config.json new file mode 100644 index 0000000000000000000000000000000000000000..07e59e6d4c9306de61be6f4ad87493e991bd40c3 --- /dev/null +++ b/mlp_out_all/layer_9_width_262k_l0_small/config.json @@ -0,0 +1,9 @@ +{ + "hf_hook_point_in": "model.layers.9.post_feedforward_layernorm.output", + "hf_hook_point_out": "model.layers.9.post_feedforward_layernorm.output", + "width": 262144, + "model_name": "gemma-v3-12b-it", + "architecture": "jump_relu", + "l0": 15, + "affine_connection": false +} \ No newline at end of file