SLM / config.json
Rahulwale12's picture
Add CPU-optimized quantized SLM model
4918845 verified
{
  "model_type": "transformer_lite",
  "architectures": [
    "TransformerLite"
  ],
  "vocab_size": 12288,
  "hidden_size": 128,
  "num_hidden_layers": 2,
  "num_attention_heads": 4,
  "intermediate_size": 512,
  "max_position_embeddings": 64,
  "quantization_bits": 8,
  "model_format": "quantized",
  "framework": "pytorch",
  "device": "cpu"
}