Add files using upload-large-folder tool
Browse files- clt/width_262k_l0_big/config.json +9 -0
- clt/width_262k_l0_big_affine/config.json +9 -0
- clt/width_262k_l0_medium/config.json +9 -0
- clt/width_262k_l0_medium/params_layer_14.safetensors +3 -0
- clt/width_262k_l0_medium/params_layer_2.safetensors +3 -0
- clt/width_262k_l0_medium/params_layer_24.safetensors +3 -0
- clt/width_262k_l0_medium_affine/config.json +9 -0
- clt/width_524k_l0_big/config.json +9 -0
- clt/width_524k_l0_big_affine/config.json +9 -0
- clt/width_524k_l0_medium/config.json +9 -0
- clt/width_524k_l0_medium_affine/config.json +9 -0
- clt/width_524k_l0_medium_affine/params_layer_11.safetensors +3 -0
- clt/width_524k_l0_medium_affine/params_layer_12.safetensors +3 -0
- clt/width_524k_l0_medium_affine/params_layer_19.safetensors +3 -0
- clt/width_524k_l0_medium_affine/params_layer_7.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_1m_l0_medium/config.json +9 -0
- crosscoder/layer_7_13_17_22_width_1m_l0_medium/params_layer_0.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_1m_l0_medium/params_layer_1.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_1m_l0_medium/params_layer_2.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_1m_l0_medium/params_layer_3.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_big/config.json +9 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_big/params_layer_0.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_big/params_layer_1.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_big/params_layer_2.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_big/params_layer_3.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_medium/config.json +9 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_medium/params_layer_0.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_medium/params_layer_1.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_medium/params_layer_2.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_262k_l0_medium/params_layer_3.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_big/config.json +9 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_big/params_layer_0.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_big/params_layer_1.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_big/params_layer_2.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_big/params_layer_3.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_medium/config.json +9 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_medium/params_layer_0.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_medium/params_layer_1.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_medium/params_layer_2.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_524k_l0_medium/params_layer_3.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_big/config.json +9 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_big/params_layer_0.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_big/params_layer_1.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_big/params_layer_2.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_big/params_layer_3.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_medium/config.json +9 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_medium/params_layer_0.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_medium/params_layer_1.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_medium/params_layer_2.safetensors +3 -0
- crosscoder/layer_7_13_17_22_width_65k_l0_medium/params_layer_3.safetensors +3 -0
clt/width_262k_l0_big/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 262080,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 150,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
clt/width_262k_l0_big_affine/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 262080,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 150,
|
| 8 |
+
"affine_connection": true
|
| 9 |
+
}
|
clt/width_262k_l0_medium/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 262080,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 50,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
clt/width_262k_l0_medium/params_layer_14.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5138b7b0143d0142f5403ecaa7c6638f5d0a8e8f3d26f4df737b93d2fb160ba
|
| 3 |
+
size 1254198912
|
clt/width_262k_l0_medium/params_layer_2.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d9ec7c490a861e3bff9bba0b43c0ce43f107d0f439f4cfbafef6dfb1beeb2e65
|
| 3 |
+
size 1254198912
|
clt/width_262k_l0_medium/params_layer_24.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:832c86300a8adeed2b4adbbd6009bcca7f7ff4d43dcd1dc621e1b4840133f0e6
|
| 3 |
+
size 1254198912
|
clt/width_262k_l0_medium_affine/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 262080,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 50,
|
| 8 |
+
"affine_connection": true
|
| 9 |
+
}
|
clt/width_524k_l0_big/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 524160,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 150,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
clt/width_524k_l0_big_affine/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 524160,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 150,
|
| 8 |
+
"affine_connection": true
|
| 9 |
+
}
|
clt/width_524k_l0_medium/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 524160,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 50,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
clt/width_524k_l0_medium_affine/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{all}.pre_feedforward_layernorm.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{all}.post_feedforward_layernorm.output",
|
| 4 |
+
"width": 524160,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 50,
|
| 8 |
+
"affine_connection": true
|
| 9 |
+
}
|
clt/width_524k_l0_medium_affine/params_layer_11.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:417f0d9d0257f61ab510f6386427a170077c97bc97ffc76e3f79f407b1807c8a
|
| 3 |
+
size 2513701352
|
clt/width_524k_l0_medium_affine/params_layer_12.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6dabc14c9e745d8af55f7daaadca6864d5289d0c57bf68fab165eb6ae614bdd2
|
| 3 |
+
size 2513701352
|
clt/width_524k_l0_medium_affine/params_layer_19.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:249a365ae9f57667c473778dcca9aa300cfdd767ecde1180f8461560cae831c9
|
| 3 |
+
size 2513701352
|
clt/width_524k_l0_medium_affine/params_layer_7.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:521a6fd30db2142435859e183dbc1b2980a3dea01f06a3a723ff2858dd50117a
|
| 3 |
+
size 2513701352
|
crosscoder/layer_7_13_17_22_width_1m_l0_medium/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 4 |
+
"width": 1048576,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 50,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
crosscoder/layer_7_13_17_22_width_1m_l0_medium/params_layer_0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f6bd269aeaf5256ac5f026f3902ccc8e977e8d1ded14c6e9f325c96d7a00df96
|
| 3 |
+
size 6041899912
|
crosscoder/layer_7_13_17_22_width_1m_l0_medium/params_layer_1.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f16eae6889e7cac4c3782e4376c67dddcbd45d7be699019f202ba40b8c11ed90
|
| 3 |
+
size 6041899912
|
crosscoder/layer_7_13_17_22_width_1m_l0_medium/params_layer_2.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:311d641e9b8435af0c0408e2fdff308467f763eea748d03243a4e555ba3851e3
|
| 3 |
+
size 6041899912
|
crosscoder/layer_7_13_17_22_width_1m_l0_medium/params_layer_3.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a56c6a5afe752f800845c7d70bf23e9b8a9169d72810e7f459e08f2167b7665b
|
| 3 |
+
size 6041899912
|
crosscoder/layer_7_13_17_22_width_262k_l0_big/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 4 |
+
"width": 262144,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 150,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
crosscoder/layer_7_13_17_22_width_262k_l0_big/params_layer_0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0ebbb7076aaaf79160ce630cb6e26e2d4a011c0e06f7a1fdf239ed9f131516da
|
| 3 |
+
size 1510478720
|
crosscoder/layer_7_13_17_22_width_262k_l0_big/params_layer_1.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:07a1f61bbc1241d8e9a790b0e22e7c3e01ae5b4a251832d4fce17dc7f2afb78d
|
| 3 |
+
size 1510478720
|
crosscoder/layer_7_13_17_22_width_262k_l0_big/params_layer_2.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea72d0bf6555e3e1d2d08141fb98dd303c6a813cb372fc077c041184f4a9b0b6
|
| 3 |
+
size 1510478720
|
crosscoder/layer_7_13_17_22_width_262k_l0_big/params_layer_3.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2da0c037047d4b4a8f8ec01bb503ce031f7aec1d14b0a7b1ad5c3ddfa5769989
|
| 3 |
+
size 1510478720
|
crosscoder/layer_7_13_17_22_width_262k_l0_medium/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 4 |
+
"width": 262144,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 50,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
crosscoder/layer_7_13_17_22_width_262k_l0_medium/params_layer_0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70e40aded206d47e936bbea84e3fd88970b96148b24192f5fcfd0eaf97ef8365
|
| 3 |
+
size 1510478720
|
crosscoder/layer_7_13_17_22_width_262k_l0_medium/params_layer_1.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3833f55a309797ae26e4ef750677945e7c45b74a8df3595ee6c74abc8101bef7
|
| 3 |
+
size 1510478720
|
crosscoder/layer_7_13_17_22_width_262k_l0_medium/params_layer_2.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25f515e19b0d4303b34045325224f54ae2772ae17adb83a8e7f63a32c1d84fb3
|
| 3 |
+
size 1510478720
|
crosscoder/layer_7_13_17_22_width_262k_l0_medium/params_layer_3.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb7c042eed5cf9bd67a41fc8aabb299d5990e7c3092a854ddcaae2e73c40d4cf
|
| 3 |
+
size 1510478720
|
crosscoder/layer_7_13_17_22_width_524k_l0_big/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 4 |
+
"width": 524288,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 150,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
crosscoder/layer_7_13_17_22_width_524k_l0_big/params_layer_0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f81595104f5352834156e6053fdfb24f0c0a2c2430c0c23f112812ca3b2b5d7d
|
| 3 |
+
size 3020952456
|
crosscoder/layer_7_13_17_22_width_524k_l0_big/params_layer_1.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52f7df080166176662defb82b8baf049613786dd339caeb475f88951805fb5c0
|
| 3 |
+
size 3020952456
|
crosscoder/layer_7_13_17_22_width_524k_l0_big/params_layer_2.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:434ca1eca8642d50baafc9fec3a9f88d6083a5f3a49f0cbfde96c19f7eee894f
|
| 3 |
+
size 3020952456
|
crosscoder/layer_7_13_17_22_width_524k_l0_big/params_layer_3.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc5966138ea23d595a06e6a3a31a88088c53d15b1ea6f0fb46a56d55ffad9f76
|
| 3 |
+
size 3020952456
|
crosscoder/layer_7_13_17_22_width_524k_l0_medium/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 4 |
+
"width": 524288,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 50,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
crosscoder/layer_7_13_17_22_width_524k_l0_medium/params_layer_0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be60dde5ee67570db13cf31bb224ad6c90e4785f7a667b10ce39cc03b8dab89e
|
| 3 |
+
size 3020952456
|
crosscoder/layer_7_13_17_22_width_524k_l0_medium/params_layer_1.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc1938c6ef836cea43987c304c16eec2735172df93bf12b3534eb5979161961f
|
| 3 |
+
size 3020952456
|
crosscoder/layer_7_13_17_22_width_524k_l0_medium/params_layer_2.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:77c028986c48874f64fa829600e12ac547d418931690451f39e62794bf45aa5a
|
| 3 |
+
size 3020952456
|
crosscoder/layer_7_13_17_22_width_524k_l0_medium/params_layer_3.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9dd7a3f33bea7f2710cc7a8564bb9af9e4e43f45430a937b2d4b78cb9c0452f
|
| 3 |
+
size 3020952456
|
crosscoder/layer_7_13_17_22_width_65k_l0_big/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 4 |
+
"width": 65536,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 150,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
crosscoder/layer_7_13_17_22_width_65k_l0_big/params_layer_0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e874f8f0f60be31860e55222609595936fb3985b9c34656c13e019a775bc350
|
| 3 |
+
size 377623424
|
crosscoder/layer_7_13_17_22_width_65k_l0_big/params_layer_1.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f56c5ef1e51b24c2db855742446fd4b3c4342e26ca06cbc3b962eb3706d133db
|
| 3 |
+
size 377623424
|
crosscoder/layer_7_13_17_22_width_65k_l0_big/params_layer_2.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a47a47689432aedb7c1dadf31a60c31979d75dadf93f437116cd11ffd5d8c0ac
|
| 3 |
+
size 377623424
|
crosscoder/layer_7_13_17_22_width_65k_l0_big/params_layer_3.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1fce4bbe53a76593354e1b5e8c41f1c548e0c8c21b89adf411fa672f44184246
|
| 3 |
+
size 377623424
|
crosscoder/layer_7_13_17_22_width_65k_l0_medium/config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"hf_hook_point_in": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 3 |
+
"hf_hook_point_out": "model.layers.{7.0,13.5,17.400000000000002,22.599999999999998}.output",
|
| 4 |
+
"width": 65536,
|
| 5 |
+
"model_name": "gemma-v3-1b-it",
|
| 6 |
+
"architecture": "jump_relu",
|
| 7 |
+
"l0": 50,
|
| 8 |
+
"affine_connection": false
|
| 9 |
+
}
|
crosscoder/layer_7_13_17_22_width_65k_l0_medium/params_layer_0.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff610c20469e1f8c37dbbc3507d3b23bae9612879e154ffd5656b4b186b81010
|
| 3 |
+
size 377623424
|
crosscoder/layer_7_13_17_22_width_65k_l0_medium/params_layer_1.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1918a823777cb3b9cd599c72a22667d490c4da651d3dbf46e4ecb807ac095bc6
|
| 3 |
+
size 377623424
|
crosscoder/layer_7_13_17_22_width_65k_l0_medium/params_layer_2.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f8b7a972e8ddc659cd6c9b89b9253c43a2593af0660ecf6da7b1b0d26fd04fd
|
| 3 |
+
size 377623424
|
crosscoder/layer_7_13_17_22_width_65k_l0_medium/params_layer_3.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5cd7d85df5877d5e985e19f39ff03d4a43c574a3f6d19ba4c538a0abbdb04f5c
|
| 3 |
+
size 377623424
|