Mayfull's picture
Training in progress, step 10000
751475d verified
raw
history blame contribute delete
320 Bytes
{
"architectures": [
"VLTopKSAE"
],
"dtype": "float32",
"expansion_factor": 32,
"hidden_size": 4096,
"k": 256,
"latent_size": 131072,
"model_type": "vl_topk_sae",
"multi_topk": false,
"normalize_decoder": true,
"transformers_version": "4.57.6",
"vl_split_ratio": [
4,
24,
4
]
}