{
  "d_in": 1024,
  "d_sae": 16384,
  "dtype": "float32",
  "device": "cuda",
  "jumprelu_init_threshold": 1.0,
  "jumprelu_bandwidth": 1.0,
  "jumprelu_sparsity_loss_mode": "step",
  "l0_coefficient": 1.0,
  "l0_warm_up_steps": 0,
  "pre_act_loss_coefficient": null,
  "jumprelu_tanh_scale": 4.0,
  "decoder_init_norm": 0.1
}