{
  "model_id": "smallthinker_3b",
  "model_arch": "qwen2",
  "version": 20241202,
  "llm_config": {
    "embed_dim": 2048,
    "ffn_dim": 11008,
    "head_size": 128,
    "kv_dim": 256,
    "n_attn_heads": 16,
    "n_attn_kv_heads": 2,
    "n_ctx": 32768,
    "n_layers": 36,
    "norm_eps": 9.999999974752427e-07,
    "vocab_size": 151936,
    "rope_config": {
      "n_rope_ctx_orig": 32768,
      "rope_attn_factor": 1.0,
      "rope_dim": 128,
      "rope_freq_base": 1000000.0,
      "rope_freq_scale": 1.0,
      "rope_scale_type": "linear",
      "rope_type": -1
    }
  },
  "vision": {}
}