diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/config.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/config.json deleted file mode 100644 index e602868a7ffb3871ad277c552b85965b53306e0f..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/config.json +++ /dev/null @@ -1 +0,0 @@ -{"sae": {"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false}, "batch_size": 16, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["model.layers.5.mlp", "model.layers.5.post_attention_layernorm", "model.layers.6.mlp", "model.layers.6.post_attention_layernorm", "model.layers.7.mlp", "model.layers.7.post_attention_layernorm", "model.layers.8.mlp", "model.layers.8.post_attention_layernorm", "model.layers.9.mlp", "model.layers.9.post_attention_layernorm", "model.layers.10.mlp", "model.layers.10.post_attention_layernorm", "model.layers.11.mlp", "model.layers.11.post_attention_layernorm", "model.layers.12.mlp", "model.layers.12.post_attention_layernorm", "model.layers.13.mlp", "model.layers.13.post_attention_layernorm", "model.layers.14.mlp", "model.layers.14.post_attention_layernorm", "model.layers.15.mlp", "model.layers.15.post_attention_layernorm", "model.layers.16.mlp", "model.layers.16.post_attention_layernorm", "model.layers.17.mlp", "model.layers.17.post_attention_layernorm", "model.layers.18.mlp", "model.layers.18.post_attention_layernorm", "model.layers.19.mlp", "model.layers.19.post_attention_layernorm"], "init_seeds": [0], "layers": [], "layer_stride": 1, "transcode": false, "distribute_modules": false, "save_every": 100000, "log_to_wandb": true, "run_name": "saes_sql_interp_bm2_cs1_experiment_4.3_syn=True/k=128", "wandb_log_frequency": 1} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/lr_scheduler.pt b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/lr_scheduler.pt deleted file mode 100644 index 1619aeb0b307c4dbe1e57034770cbd69eb75c48b..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/lr_scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0c1a4ccded57e94e581be291e5bc725b8c8e883138bcad563998f929ce54ece4 -size 1652 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/metrics.json deleted file mode 100644 index 60fae66868c7d709830ace1320203cf0cc0bda52..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.011143377050757408, "dead_pct": 0.00758928619325161} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/sae.safetensors deleted file mode 100644 index 201a966cc0bc2a13b129ea5fbab4dfdfe1fd20b5..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:26b70e6030838b0a5139b6d3ad6b6ce3a919ee94dd20ecbca513028fa96adfcc -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/metrics.json deleted file mode 100644 index 718a93c11f2d817935595b3bc14287e2884d4672..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.004017857369035482, "fvu": 0.008762086741626263} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 385db68c8aeb2818409ebd433c3c9b89c75793e1..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.10.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d87920aa769096bb31889dcd100d7760890cb9c65ba7fa49ed4bf74e6ebe798f -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/metrics.json deleted file mode 100644 index c2a513f56eff6642cfe0b421f0cb787ae107cbd1..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.012227058410644531, "dead_pct": 0.0096726194024086} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/sae.safetensors deleted file mode 100644 index 16068bfe82d94790d5bc287b4a4f66725a92630e..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:00530f95e7f09543bedf83233ad4adeba0d0adf97a619d8ebed51aa1128077da -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/metrics.json deleted file mode 100644 index bfe421648d5a157a6287aa01aaed01e46a198728..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.00513392873108387, "fvu": 0.010888863354921341} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/sae.safetensors deleted file mode 100644 index b687ea05fc99bdc896af19eb1c3cf0de091f3498..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.11.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e7e6a4919d9b0aeb08d3314734ab3ec46a8978780fd60c0dab53c1acaa1b7749 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/metrics.json deleted file mode 100644 index b75d6bf8ab598166533cce87a2e79c99a24443e2..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.013765087351202965, "dead_pct": 0.007663690950721502} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/sae.safetensors deleted file mode 100644 index c4612b6c4333b6f7d73945b8752b32c5cbd75f67..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e16c225c2d47b5a6615914d8a4e62c7d863373a0fb078c0cc7ff0b1c6d22e20f -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/metrics.json deleted file mode 100644 index 14f38495331fe72aa4ae9e3f53e860ad9741089d..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.010856058448553085, "dead_pct": 0.01004464365541935} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/sae.safetensors deleted file mode 100644 index c3883bdccc426bbe5cd204dc9a9ef7c5a8100b7f..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.12.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7b266fcccbc2a12baeb5e9c14f7434f4c725e4eee7a7c5a23df51d6a6e256f7b -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/metrics.json deleted file mode 100644 index 067424b36940246fe18164a3cba621f957b9d909..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.015192780643701553, "dead_pct": 0.0055059525184333324} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/sae.safetensors deleted file mode 100644 index 721f19ebf150971e7ca5e605bcb1b0407c2ee3e8..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fe702ea2a7d8e08337c980bb9eee72d9149c8911166f237721e364b18d250035 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/metrics.json deleted file mode 100644 index 32e5f48fe09fcfd982084c15c07aa0e5683802f0..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.01202225312590599, "dead_pct": 0.01004464365541935} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 59e05a540bcc5cad39a19b2fc1b4d90bcb762ff7..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.13.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5c9c78a5bf72a2681a3c85b450b37d11287976c167a19536b8207101ef6105bd -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/metrics.json deleted file mode 100644 index a68a9d2b1c1752f63b37a2676d8e1e07f27a4bcb..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.01987934298813343, "dead_pct": 0.0012648809934034944} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/sae.safetensors deleted file mode 100644 index c6ae82c5575b6b63f01f33e95e32615853d7118d..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a6e3f2d1a8870029e1f3a890637a34c7f65336744156a07a48b7a6c1de1c9117 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/metrics.json deleted file mode 100644 index 2b297543ea3b3ded3f2c87d65217db23cf97c396..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.00907738134264946, "fvu": 0.014239244163036346} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 671c28448daeced1e750bfc8fa5ca243a8077171..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.14.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c71198823012d8575bd5aa4ab8d92ccd37da5b9b265a06498777e0b5624ce0ce -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/metrics.json deleted file mode 100644 index 4ef83d60d3fbfb66c8d31dd9d2c4ff4098a54d9d..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0005208333604969084, "fvu": 0.023401465266942978} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/sae.safetensors deleted file mode 100644 index 085849b56d4dfd7d5ce853614e8c44eb8eba0e84..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:082673861e33fabb4d467840ba2e8598256763dfc348f4647e2760a37cddebbe -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/metrics.json deleted file mode 100644 index 21146e11096bb50c56101252df16376dac619281..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.014060208573937416, "dead_pct": 0.004092262126505375} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 957bb632e1ccef2a7a05e38cb356831a512a7ffd..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.15.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:924e63b29c8a439afdd9f18892fbfe0899b1e0d110307cf54a6043b60afadf41 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/metrics.json deleted file mode 100644 index 50ce5f2a49af81800edc7adaa5865e6d8c7e94cb..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.016603531315922737, "dead_pct": 0.00022321430151350796} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/sae.safetensors deleted file mode 100644 index ae1edb582e60eabb81933fc498584eb2c075f0e8..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:14b234d5e11026e3beafd482b1ae7b14571996abc94e5d2b72f92ea83cc74308 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/metrics.json deleted file mode 100644 index a09f3610f55ec91f1fddf1456a18c61d72293adb..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.013535319827497005, "dead_pct": 0.0027529762592166662} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 5cdcfe002efa0fe5f97c1c7e468c203415537450..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.16.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bdd4138f7126c21b3c2c52502c86a18c7b14d5ce75cf66d5a73d2e75b63e7656 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/metrics.json deleted file mode 100644 index d329672a874e600da2caa779719f9916cadc1ad5..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0014136905083432794, "fvu": 0.011707901023328304} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/sae.safetensors deleted file mode 100644 index b3217fa00a2766b035bdecddb0a3ec0c81a29196..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5d31d0403c99aeacbb92a2b74e829a0edf56793ff0136d6c6f7f4ace994546c8 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/metrics.json deleted file mode 100644 index af206c19a7ffa6a7b9c4f92512df70ac1ba5c36e..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.011492160148918629, "dead_pct": 0.002306547714397311} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 7c5d0c11d9d84ad7e3778002e4661044324a5ce8..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.17.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:526f3402b3c6843b76fe8e83f1159fe894f13254d252872ff8ae0be67c7ac82b -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/metrics.json deleted file mode 100644 index ed252d7c518d1c5f687e53529c0ee1bd44dca06d..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0, "fvu": 0.015863902866840363} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/sae.safetensors deleted file mode 100644 index 11930d32b6b25474fc610d319459f24fa1dbc9d6..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c5f0d3424871b23a14367deddadf769138093b8a7648ee901858f3adf5311a67 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/metrics.json deleted file mode 100644 index 8d7e6f7a5af2692e5d864769e52fac3c33904c11..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0006696428754366934, "fvu": 0.012910332530736923} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 412ca3c5f20ee35f16816cb2d1827ebf8e755415..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.18.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a8d71c249d55d4d0a963a70a88d3f567c1da64a7941ef39e6d53098024e447a2 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/metrics.json deleted file mode 100644 index 49a939119a919940e345e7c0a939085033d24e64..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.00014880952949170023, "fvu": 0.015174311585724354} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/sae.safetensors deleted file mode 100644 index 9066824347dcde625f712b71ed63532dec51c0d8..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5e306994a36b48445298deefee7782c59af463e613b0996bc62a77b5fce83f2c -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/metrics.json deleted file mode 100644 index 6b86ac04be85246f02d8d84d97e6f4f54e2e0830..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.011404115706682205, "dead_pct": 7.440476474585012e-05} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/sae.safetensors deleted file mode 100644 index ec3e70686b088c410ba91202112562b83c8f2e71..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.19.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d0af0d62ad16102b412e41fb06c4339b58531062aa0ed364e029d3209cc6f186 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/metrics.json deleted file mode 100644 index 3e80563caadbf05465795c3d3d8f1d7e973c4cee..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.004711732268333435, "dead_pct": 0.006473214365541935} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/sae.safetensors deleted file mode 100644 index affed3f4db3d562bbf276f718ace00557ee49db6..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ac68bb6d08d1487e7e063259dde4a65134a8dc1a68c54d6211cb205c9b7cf52b -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/metrics.json deleted file mode 100644 index 8ac6d24954b8a4b20a3783a29ab26ce4547f2b3c..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.005395248997956514, "dead_pct": 0.0016369047807529569} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 66790f388c1f2dba516fdde5cda71a10b91cfd73..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.5.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:500119928adbd83ff45f02fcb588512ff28094036d8f32b8f94432188ea53577 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/metrics.json deleted file mode 100644 index 3413e5365a254fe851cece95e0da8eda802a0443..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0020833334419876337, "fvu": 0.008038644678890705} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/sae.safetensors deleted file mode 100644 index 39eaf1f5c6bd0eaa4836dd28cf5e63ab17f4073b..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7fd5b2cce386597957af3ebb6f1ddf26950a6174022d3535674f13a7ff120e7a -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/metrics.json deleted file mode 100644 index fa8be551a09935422fffd95511165d7d1c615b00..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.002008928684517741, "fvu": 0.005864235106855631} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 775b6e7e45b20098a77da55514415277f91d7716..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.6.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5a41496fc546d36e80b0e506d3ad6f356f56f64278ff51421c282aed98b12775 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/metrics.json deleted file mode 100644 index d9d020075b44270539241d4cb2a04aaf795bf1e2..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.008542937226593494, "dead_pct": 0.002455357229337096} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/sae.safetensors deleted file mode 100644 index b710b476b3e50006b6436a2c0336c910a41ec30b..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d16148199142a6c0fdbd3e9474ea6be1587c43ae6a2a08bb8fb31a474baa2237 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/metrics.json deleted file mode 100644 index ac24a1cbf020878d6d09f674ee94ce2425b88a57..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.005462926346808672, "dead_pct": 0.0009672619635239244} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/sae.safetensors deleted file mode 100644 index d0a34a7308e0800496708350afc886bece065001..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.7.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5d65af97d49b20a545c511a64549524a6e86286eb37799e95023f5204e2771cf -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/metrics.json deleted file mode 100644 index a38c120e6cb5d5624915423ede87dd3fb9b34c33..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.008527319878339767, "dead_pct": 0.0048363097012043} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/sae.safetensors deleted file mode 100644 index 87bcc0926fdb4cc0103326fca9e560f05dbe99f3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d6ceb1a264b3b6822b51ddd5de84d4ec3359c7d22241c0bd8d17b8e487157092 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/metrics.json deleted file mode 100644 index beddb13b0cf9177b96978a55e51e6bb60d730ee2..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0025297619868069887, "fvu": 0.005849564913660288} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 696d12ff3cae0df88402f7cb820ce4cf26a2a7be..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.8.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c1e24c674738b7644bc469e46f31b9ca1039b161d5bcb77cb5ba27394eebca72 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/metrics.json deleted file mode 100644 index c5f7d43fb66b2dc96df1aecf4492f4e7d8b6cbf6..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0031994048040360212, "fvu": 0.010036525316536427} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/sae.safetensors deleted file mode 100644 index b99b2d6d77d275474afc348bf447b5000db8e63f..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a1a97bf21a31f90a51e34caf9d333560ac6c2cd2b749fea3ac5b138e897ba9be -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/cfg.json deleted file mode 100644 index 8655981effb80369bfa02540354ed1ea53920cf3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/metrics.json deleted file mode 100644 index 7877c590022d232c6fb6643af7531f3305fc84b9..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0034226190764456987, "fvu": 0.007193866651505232} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 9a29ce5047ae0ab6932d0306e6a1194d683223e0..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model.layers.9.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fd81271e973a4ebcffacde5d9517e3f05c30568531ff4cf44437c2fbb12fcdcd -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model_config.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model_config.json deleted file mode 100644 index a96bcf4f590864a5b571e20ff6dbb25da603f0e4..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/model_config.json +++ /dev/null @@ -1 +0,0 @@ -{"model_name": "withmartian/sql_interp_bm2_cs1_experiment_4.3", "dataset_name": "withmartian/cs1_dataset_synonyms", "model_abbrev": "saes_sql_interp_bm2_cs1_experiment_4.3_syn=True"} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/state.pt b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/state.pt deleted file mode 100644 index f864d3a295c1411f4392132d5ecb21a314b734ed..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=128/state.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d5bebb4e2775c1a8899a141974257e76f388280211e3f04ca2424442695d52f3 -size 3233272 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/config.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/config.json deleted file mode 100644 index 395b6495bb8945c0298bdc77c7365079a09dccf5..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/config.json +++ /dev/null @@ -1 +0,0 @@ -{"sae": {"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false}, "batch_size": 16, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["model.layers.5.mlp", "model.layers.5.post_attention_layernorm", "model.layers.6.mlp", "model.layers.6.post_attention_layernorm", "model.layers.7.mlp", "model.layers.7.post_attention_layernorm", "model.layers.8.mlp", "model.layers.8.post_attention_layernorm", "model.layers.9.mlp", "model.layers.9.post_attention_layernorm", "model.layers.10.mlp", "model.layers.10.post_attention_layernorm", "model.layers.11.mlp", "model.layers.11.post_attention_layernorm", "model.layers.12.mlp", "model.layers.12.post_attention_layernorm", "model.layers.13.mlp", "model.layers.13.post_attention_layernorm", "model.layers.14.mlp", "model.layers.14.post_attention_layernorm", "model.layers.15.mlp", "model.layers.15.post_attention_layernorm", "model.layers.16.mlp", "model.layers.16.post_attention_layernorm", "model.layers.17.mlp", "model.layers.17.post_attention_layernorm", "model.layers.18.mlp", "model.layers.18.post_attention_layernorm", "model.layers.19.mlp", "model.layers.19.post_attention_layernorm"], "init_seeds": [0], "layers": [], "layer_stride": 1, "transcode": false, "distribute_modules": false, "save_every": 100000, "log_to_wandb": true, "run_name": "saes_sql_interp_bm2_cs1_experiment_4.3_syn=True/k=256", "wandb_log_frequency": 1} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/lr_scheduler.pt b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/lr_scheduler.pt deleted file mode 100644 index 4dceeaf3df0b35c80daf7324b1896244d7b14f52..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/lr_scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c342c3270b5cc3fc57fef361246a67b03ad4c70ca9b2820108ee95d3b45d568e -size 1652 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/metrics.json deleted file mode 100644 index 0641464e01d2f7bd814c9950abf92667feb9ba64..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.007389636244624853, "dead_pct": 0.005059523973613977} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/sae.safetensors deleted file mode 100644 index 889f9333ec490494005e696b875f0bbb287c1b70..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.mlp/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5b40a68aea0d43a106de8eb009b3238e731de4447307d08cb99a5612889df16a -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/metrics.json deleted file mode 100644 index fafce64beef9fb5b45ccc17cad9a051c25874070..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.005201994441449642, "dead_pct": 0.0014880952658131719} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/sae.safetensors b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/sae.safetensors deleted file mode 100644 index 859289475491146fd8f1596d5307e560aab6fb78..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.10.post_attention_layernorm/sae.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:87c7957f5eb7fb9bf98b6b5491f893a593f0795ade55dcb1adb17dd67bb62209 -size 96395592 diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.mlp/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.mlp/metrics.json deleted file mode 100644 index 2a5a74f44a51718a72d9e450a0f91f8f81150574..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0078125, "fvu": 0.006918993778526783} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.post_attention_layernorm/metrics.json deleted file mode 100644 index 6b53226fa79606977aa1316c59f874c69c3d93d8..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.11.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.0065234145149588585, "dead_pct": 0.002455357229337096} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.mlp/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.mlp/metrics.json deleted file mode 100644 index 5bb7f57931878ca608dbfeb725b81610572ee20b..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.007560656871646643, "dead_pct": 0.0061011905781924725} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.post_attention_layernorm/metrics.json deleted file mode 100644 index 6d5b38a8de589b6922647779fe2086fa8bcd2fc3..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.12.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.006123366300016642, "dead_pct": 0.00364583358168602} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.mlp/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.mlp/metrics.json deleted file mode 100644 index 6dcabb12b8b68ce86494e72528da7050ea4a5707..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.010443536564707756, "dead_pct": 0.0017113095382228494} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.post_attention_layernorm/metrics.json deleted file mode 100644 index fd49e2ab3c91e93dbf1e111d48dfcf15956af963..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.13.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.002455357229337096, "fvu": 0.009360969997942448} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.mlp/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.mlp/metrics.json deleted file mode 100644 index 720f87c5d954793dba426c76842e90328f97cb03..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.00029761905898340046, "fvu": 0.011759531684219837} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.post_attention_layernorm/metrics.json deleted file mode 100644 index 8a5a5c5ebf879e3324d8458a48479eb128c5b6b5..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.14.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0011160714784637094, "fvu": 0.007400806527584791} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.mlp/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.mlp/metrics.json deleted file mode 100644 index e851da25ab43b6d9bb501c37b21ee98022cb67e2..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.01267997082322836, "dead_pct": 0.00022321430151350796} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.post_attention_layernorm/metrics.json deleted file mode 100644 index 0196b413d0dce982f902e0b26601dc8fbaa25992..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.15.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.009873402304947376, "dead_pct": 0.0006696428754366934} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.mlp/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.mlp/metrics.json deleted file mode 100644 index eac74d6b266ddc02fd8a3dcb3b6a04ce9a81c317..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0, "fvu": 0.012106050737202168} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.post_attention_layernorm/metrics.json deleted file mode 100644 index 6085913f8739ee1a77bfef7d9ad15a1276ab01bb..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.16.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.00029761905898340046, "fvu": 0.0077447108924388885} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.mlp/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.mlp/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.mlp/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.mlp/metrics.json deleted file mode 100644 index 295f6addbb5fab4f54a773c17cf31e8b655e2de8..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.008571564219892025, "dead_pct": 0.0} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.post_attention_layernorm/metrics.json deleted file mode 100644 index a535c5c5437f95d9b55e029c2d5efea81287fdf9..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.17.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 0.0, "fvu": 0.0074108862318098545} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.mlp/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.mlp/metrics.json deleted file mode 100644 index 05c7ce0abca2bde9e708e24316d4dbb2f509bf0a..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.mlp/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"fvu": 0.011035350151360035, "dead_pct": 0.0} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.post_attention_layernorm/cfg.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.post_attention_layernorm/cfg.json deleted file mode 100644 index 9a6f583aca1e21b0652587d5f8094c04fa7d7325..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.post_attention_layernorm/cfg.json +++ /dev/null @@ -1 +0,0 @@ -{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 896} \ No newline at end of file diff --git a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.post_attention_layernorm/metrics.json b/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.post_attention_layernorm/metrics.json deleted file mode 100644 index 016fe9fbf34bc786f18cd8ad58b6985e992cecb5..0000000000000000000000000000000000000000 --- a/saes_sql_interp_bm2_cs1_experiment_430_syn=True/k=256/model.layers.18.post_attention_layernorm/metrics.json +++ /dev/null @@ -1 +0,0 @@ -{"dead_pct": 7.440476474585012e-05, "fvu": 0.008274384774267673} \ No newline at end of file