{ "vocab_size": 50257, "dim": 256, "n_layers": 4, "n_heads": 4, "max_seq_len": 512, "architecture": "DeepSeekTransformer", "components": [ "RMSNorm", "RoPE", "SwiGLU" ] }