{
  "trainer": {
    "trainer_class": "TrainerTopK",
    "dict_class": "AutoEncoderTopK",
    "lr": 0.00032659863237109043,
    "steps": 30000,
    "seed": null,
    "activation_dim": 768,
    "dict_size": 6144,
    "k": 30,
    "device": "cuda",
    "layer": "0",
    "lm_name": "TinyModel_2L_3E",
    "wandb_name": "AutoEncoderTopK",
    "submodule_name": null
  },
  "buffer": {
    "d_submodule": 768,
    "io": "out",
    "n_ctxs": 30000.0,
    "ctx_len": 128,
    "refresh_batch_size": 512,
    "out_batch_size": 8192,
    "device": "cuda"
  }
}