SlimMoE-250M-base / config.json
{
"adaptive_routing": true,
"architectures": [
"SlimMoEForCausalLM"
],
"auto_map": {
"AutoConfig": "configuration_slim_moe.SlimMoEConfig",
"AutoModelForCausalLM": "modeling_slim_moe.SlimMoEForCausalLM"
},
"dim": 768,
"dropout": 0.1,
"hidden_dim": 1536,
"max_seq_len": 2048,
"model_type": "slim_moe",
"num_experts": 4,
"num_heads": 12,
"num_hidden_layers": 16,
"torch_dtype": "float32",
"transformers_version": "4.53.2",
"vocab_size": 50257
}
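
Because "auto_map" points to custom SlimMoEConfig and SlimMoEForCausalLM classes (configuration_slim_moe.py / modeling_slim_moe.py in the repo), the checkpoint has to be loaded with trust_remote_code=True. Below is a minimal loading sketch; the repo id "SlimFactory/SlimMoE-250M-base" and the GPT-2 tokenizer pairing (suggested by vocab_size 50257) are assumptions, not confirmed by the config itself.

# Minimal sketch of loading this checkpoint.
# Assumptions: repo id "SlimFactory/SlimMoE-250M-base" and a GPT-2 tokenizer
# (vocab_size 50257 matches GPT-2, but the actual tokenizer is not specified here).
from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer

repo_id = "SlimFactory/SlimMoE-250M-base"  # hypothetical repo id

# trust_remote_code=True is required because "auto_map" resolves to the
# custom SlimMoEConfig / SlimMoEForCausalLM classes shipped with the repo.
config = AutoConfig.from_pretrained(repo_id, trust_remote_code=True)
model = AutoModelForCausalLM.from_pretrained(repo_id, trust_remote_code=True)

# Assumed tokenizer pairing based on the GPT-2-sized vocabulary.
tokenizer = AutoTokenizer.from_pretrained("gpt2")

print(config.num_experts, config.num_hidden_layers, config.max_seq_len)  # 4 16 2048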