| {"device": "cuda:0", "dtype": "torch.float32", "seed": 42, "model_name": "meta-llama/Llama-3.2-1B", "d_in": 2048, "d_latent": 7100, "n_layers": 16, "jumprelu_bandwidth": 1.0, "jumprelu_init_threshold": 0.03, "normalize_decoder": false, "dead_feature_window": 250, "cross_layer_decoders": true, "context_size": 16, "functional_loss": "kl", "l0_coefficient": 30.0, "ddp": true, "fsdp": false} |