chess-transformer-200m / config.json
avewright's picture
Upload config.json with huggingface_hub
d8a3c12 verified
raw
history blame contribute delete
516 Bytes
{
"architecture": "ChessTransformer200M",
"params": 204006404,
"encoder_dim": 256,
"hidden_dim": 1024,
"num_layers": 16,
"num_heads": 16,
"ffn_ratio": 4,
"policy_head_dim": 512,
"value_hidden": 512,
"vocab_size": 5504,
"training": {
"steps": 10000,
"positions_seen": 10240256,
"batch_size": 256,
"accum_steps": 4,
"effective_batch": 1024,
"lr": 0.0002,
"best_accuracy": 0.184,
"dataset": "avewright/chess-positions-lichess-sf",
"gpu": "NVIDIA A40 46GB"
}
}