tinystories-25m / config.json
epoyraz's picture
Upgrade to modded+Muon+zero-init checkpoint (val 2.65 -> 2.40)
4cae3f7 verified
{
"vocab_size": 16384,
"block_size": 256,
"n_embd": 384,
"n_head": 6,
"n_layer": 8,
"use_rope": true,
"n_kv_head": 2,
"use_swiglu": false,
"use_rmsnorm": true,
"use_mtp": true,
"mtp_heads": 2,
"mtp_weight": 0.1,
"tie_mtp_lm_head": true,
"use_relu2": true,
"use_qk_norm": true,
"logit_cap": 15.0,
"use_zero_init": true
}