loaded v18 bin: vocab=128 d_model=256 n_layers=8 n_heads=8 d_ff=512 T_max=256 M=65536