Coaster41 committed on
Commit
d4d0695
·
verified ·
1 Parent(s): 3b866db

Upload SAE blocks.0.hook_mlp_out

Browse files
blocks.0.hook_mlp_out/cfg.json CHANGED
@@ -1 +1 @@
1
- {"d_in": 256, "d_sae": 8192, "dtype": "float32", "device": "cuda", "apply_b_dec_to_input": false, "normalize_activations": "none", "reshape_activations": "none", "metadata": {"sae_lens_version": "6.5.3", "sae_lens_training_version": "6.5.3", "dataset_path": "autogluon/chronos_datasets", "hook_name": "blocks.0.hook_mlp_out", "model_name": "patchtst_relu", "model_class_name": "HookedTransformer", "hook_head_index": null, "context_size": 512, "num_patches": 32, "seqpos_slice": [null], "model_from_pretrained_kwargs": {"center_writing_weights": false}, "prepend_bos": false, "sequence_separator_token": null, "disable_concat_sequences": false}, "decoder_init_norm": 0.1, "l1_coefficient": 6, "lp_norm": 1.0, "l1_warm_up_steps": 5000, "architecture": "standard"}
 
1
+ {"d_in": 256, "d_sae": 8192, "dtype": "float32", "device": "cuda", "apply_b_dec_to_input": false, "normalize_activations": "none", "reshape_activations": "none", "metadata": {"sae_lens_version": "6.5.3", "sae_lens_training_version": "6.5.3", "dataset_path": "autogluon/chronos_datasets", "hook_name": "blocks.0.hook_mlp_out", "model_name": "patchtst_relu", "model_class_name": "HookedTransformer", "hook_head_index": null, "context_size": 512, "num_patches": 32, "seqpos_slice": [null], "model_from_pretrained_kwargs": {"center_writing_weights": false}, "prepend_bos": false, "sequence_separator_token": null, "disable_concat_sequences": false}, "decoder_init_norm": 0.1, "l1_coefficient": 6, "lp_norm": 1.0, "l1_warm_up_steps": 10000, "architecture": "standard"}
blocks.0.hook_mlp_out/sae_weights.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb52bd0bf714f9a4becc9278a0648ae5495251e9d077d04fdd99b649d5a36505
3
  size 16811312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b23193583341d63b159214e434b04008ae0848ca73173aef654f5da6aa088a5d
3
  size 16811312