DevStudio-Coder-1.5B-MLC / mlc-chat-config.json
devstudio-live's picture
Add MLC/WebGPU compiled model for WebLLM
638cba9 verified
raw
history blame
526 Bytes
{
  "model_id": "DevStudio-Coder-1.5B-q4f16_1-MLC",
  "model_type": "qwen2",
  "hidden_act": "silu",
  "hidden_size": 1536,
  "intermediate_size": 8960,
  "num_attention_heads": 12,
  "num_hidden_layers": 28,
  "num_key_value_heads": 2,
  "rms_norm_eps": 1e-6,
  "rope_theta": 1000000.0,
  "vocab_size": 151936,
  "tokenizer_files": ["tokenizer.json", "tokenizer_config.json"],
  "conv_template": "qwen2",
  "context_window_size": 4096,
  "prefill_chunk_size": 1024,
  "sliding_window_size": -1,
  "attention_sink_size": -1
}