3719d13
1
2
3
4
5
6
7
8
9
10
11
12
13
{ "vocab_size": 50257, "dim": 256, "n_layers": 4, "n_heads": 4, "max_seq_len": 512, "architecture": "DeepSeekTransformer", "components": [ "RMSNorm", "RoPE", "SwiGLU" ] }