chessgpt / config.json
malcouffe's picture
Convert to HuggingFace format (safetensors + trust_remote_code)
1d38600 verified
raw
history blame contribute delete
517 Bytes
{
"auto_map": {
"AutoConfig": "configuration_chessgpt.ChessGPTConfig",
"AutoModelForCausalLM": "modeling_chessgpt.ChessGPTForCausalLM"
},
"bos_token_id": 1,
"d_ff": 3584,
"d_model": 1280,
"dropout": 0.0,
"eos_token_id": 2,
"max_seq_len": 256,
"model_type": "chessgpt",
"n_heads": 20,
"n_layers": 21,
"pad_token_id": 0,
"rms_norm_eps": 1e-06,
"rope_theta": 10000.0,
"tie_word_embeddings": true,
"transformers_version": "5.2.0",
"vocab_size": 4211,
"weight_init_std": 0.02
}