Llava_Next_VLTopKSAE_8 / config.json
Mayfull's picture
Training in progress, step 10000
69cfc03 verified
raw
history blame contribute delete
321 Bytes
{
"architectures": [
"VLTopKSAE"
],
"dtype": "float32",
"expansion_factor": 32,
"hidden_size": 4096,
"k": 256,
"latent_size": 131072,
"model_type": "vl_topk_sae",
"multi_topk": false,
"normalize_decoder": true,
"transformers_version": "4.57.6",
"vl_split_ratio": [
12,
8,
12
]
}