{ "vocab_size": 50257, "d_model": 1024, "n_heads": 16, "n_layers": 24, "d_ff": 4096, "max_seq_len": 1024, "dropout": 0.1 }