{ "format_version": 1, "checkpoint_type": "pretrain", "model_config": { "vocab_size": 4278, "max_seq_len": 256, "n_outcomes": 5, "d_model": 512, "n_layers": 8, "n_heads": 8, "d_ff": 2048, "dropout": 0.0, "rope_base": 10000.0 }, "training_config": { "lr": 0.0003, "weight_decay": 0.01, "max_grad_norm": 1.0, "warmup_steps": 1000, "total_steps": 100000, "batch_size": 256, "max_ply": 256, "discard_ply_limit": false, "num_workers": 4, "use_amp": true, "accumulation_steps": 1, "log_interval": 10, "eval_interval": 500, "checkpoint_interval": 5000, "base_seed": 42, "val_seed": 9223372036854775807, "val_games": 512, "checkpoint_dir": "logs/run_20260322_182707/checkpoints", "log_dir": "logs", "use_wandb": false, "wandb_project": "pawn", "device": "cuda" } }