Coaster41 committed on
Commit
ba94f1e
·
verified ·
1 Parent(s): b719a05

Upload SAE blocks.0.hook_mlp_out

Browse files
blocks.0.hook_mlp_out/cfg.json CHANGED
@@ -1 +1 @@
1
- {"d_in": 256, "d_sae": 2048, "dtype": "float32", "device": "cuda", "apply_b_dec_to_input": false, "normalize_activations": "none", "reshape_activations": "none", "metadata": {"sae_lens_version": "6.5.3", "sae_lens_training_version": "6.5.3", "dataset_path": "autogluon/chronos_datasets", "hook_name": "blocks.0.hook_mlp_out", "model_name": "patchtst_relu", "model_class_name": "HookedTransformer", "hook_head_index": null, "context_size": 512, "num_patches": 32, "seqpos_slice": [null], "model_from_pretrained_kwargs": {"center_writing_weights": false}, "prepend_bos": false, "sequence_separator_token": null, "disable_concat_sequences": false}, "decoder_init_norm": 0.1, "l1_coefficient": 6, "lp_norm": 1.0, "l1_warm_up_steps": 3000, "architecture": "standard"}
 
1
+ {"d_in": 256, "d_sae": 2048, "dtype": "float32", "device": "cuda", "apply_b_dec_to_input": false, "normalize_activations": "none", "reshape_activations": "none", "metadata": {"sae_lens_version": "6.5.3", "sae_lens_training_version": "6.5.3", "dataset_path": "autogluon/chronos_datasets", "hook_name": "blocks.0.hook_mlp_out", "model_name": "patchtst_relu", "model_class_name": "HookedTransformer", "hook_head_index": null, "context_size": 512, "num_patches": 32, "seqpos_slice": [null], "model_from_pretrained_kwargs": {"center_writing_weights": false}, "prepend_bos": false, "sequence_separator_token": null, "disable_concat_sequences": false}, "decoder_init_norm": 0.1, "l1_coefficient": 6, "lp_norm": 1.0, "l1_warm_up_steps": 10000, "architecture": "standard"}
blocks.0.hook_mlp_out/sae_weights.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c389bbbc427a5dce8a302528574b1f097b67bf1788d60191e3f9aaf33c104d25
3
  size 4203824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0a6ec80bca71909991ddceba321b9fe6cd2d464bc7d3fc776c9a03b01a4e2e6
3
  size 4203824