Mayfull's picture
Training in progress, step 886
2200e18 verified
{
"architectures": [
"VLTopKSAE"
],
"dtype": "float32",
"expansion_factor": 16,
"hidden_size": 768,
"k": 32,
"latent_size": 0,
"model_type": "vl_topk_sae",
"multi_topk": false,
"normalize_decoder": true,
"transformers_version": "4.57.6",
"vl_split_ratio": [
2,
12,
2
]
}