Delete trained_saes

Browse files

Files changed (3) hide show

trained_saes/batch_top_k/google_gemma-2-2b_batch_top_k/resid_post_layer_12/trainer_0/ae.pt +0 -3
trained_saes/batch_top_k/google_gemma-2-2b_batch_top_k/resid_post_layer_12/trainer_0/config.json +0 -32
trained_saes/batch_top_k/google_gemma-2-2b_batch_top_k/resid_post_layer_12/trainer_0/eval_results.json +0 -1

trained_saes/batch_top_k/google_gemma-2-2b_batch_top_k/resid_post_layer_12/trainer_0/ae.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:7fd9e44e2ace29771e0dd496366882948650e4b72fbfa522726eda50261580b0
-size 302066710

trained_saes/batch_top_k/google_gemma-2-2b_batch_top_k/resid_post_layer_12/trainer_0/config.json DELETED Viewed

@@ -1,32 +0,0 @@
-{
-    "trainer": {
-        "trainer_class": "BatchTopKTrainer",
-        "dict_class": "BatchTopKSAE",
-        "lr": 0.0003,
-        "steps": 2441,
-        "auxk_alpha": 0.03125,
-        "warmup_steps": 1000,
-        "decay_start": 1952,
-        "threshold_beta": 0.999,
-        "threshold_start_step": 1000,
-        "top_k_aux": 1152,
-        "seed": 0,
-        "activation_dim": 2304,
-        "dict_size": 16384,
-        "k": 320,
-        "device": "cuda:6",
-        "layer": 12,
-        "lm_name": "google/gemma-2-2b",
-        "wandb_name": "BatchTopKTrainer-google/gemma-2-2b-resid_post_layer_12_trainer_0",
-        "submodule_name": "resid_post_layer_12"
-    },
-    "buffer": {
-        "d_submodule": 2304,
-        "io": "out",
-        "n_ctxs": 1953,
-        "ctx_len": 128,
-        "refresh_batch_size": 4,
-        "out_batch_size": 2048,
-        "device": "cuda:6"
-    }
-}

trained_saes/batch_top_k/google_gemma-2-2b_batch_top_k/resid_post_layer_12/trainer_0/eval_results.json DELETED Viewed

@@ -1 +0,0 @@

- {"l2_loss": 52.62875, "l1_loss": 1287.76, "l0": 310.368125, "frac_variance_explained": 0.81931640625, "cossim": 0.93048828125, "l2_ratio": 0.92916015625, "relative_reconstruction_bias": 0.99939453125, "loss_original": 2.6491796875, "loss_reconstructed": 3.083125, "loss_zero": 12.4375, "frac_recovered": 0.95533203125, "frac_alive": 0.99993896484375, "hyperparameters": {"n_inputs": 200, "context_length": 128}}