jacobcd52
/

insecure_diffing

jacobcd52 committed on Mar 1, 2025

Commit

c20a1bd

verified ·

1 Parent(s): 36e9df5

Upload trainer_0/config.json with huggingface_hub

Files changed (1) hide show

trainer_0/config.json CHANGED Viewed

@@ -7,15 +7,18 @@
         "lr": 1e-06,
         "l1_penalty": 0.01,
         "warmup_steps": 0,
-        "sparsity_warmup_steps": 2000,
-        "steps": 61035,
         "decay_start": null,
         "seed": null,
         "device": "cuda:2",
         "layer": 7,
         "lm_name": "blah",
         "wandb_name": "StandardTrainerAprilUpdate",
-        "submodule_name": null
     },
     "buffer": {
         "n_models": 2,
@@ -23,8 +26,8 @@
         "io": "out",
         "n_ctxs": 512,
         "ctx_len": 256,
-        "refresh_batch_size": 512,
-        "out_batch_size": 8192,
         "device": "cuda:2",
         "rescale_acts": false
     }

         "lr": 1e-06,
         "l1_penalty": 0.01,
         "warmup_steps": 0,
+        "sparsity_warmup_steps": 0,
+        "steps": 30517,
         "decay_start": null,
         "seed": null,
         "device": "cuda:2",
         "layer": 7,
         "lm_name": "blah",
         "wandb_name": "StandardTrainerAprilUpdate",
+        "submodule_name": null,
+        "frac_features_shared": 0.1,
+        "shared_l1_penalty": 0.002,
+        "num_shared_features": 5734
     },
     "buffer": {
         "n_models": 2,
         "io": "out",
         "n_ctxs": 512,
         "ctx_len": 256,
+        "refresh_batch_size": 1024,
+        "out_batch_size": 16384,
         "device": "cuda:2",
         "rescale_acts": false
     }