v1.0.0: searchless_chess vocab, 512 context, 200K steps
Squash-merge of run/co_pretraining_2026_04_13 into main.
Replaces the legacy backbone (4,278-token coordinate vocab, 256 context,
prepend_outcome=True, 100K steps) with the v1.0.0 backbone:
- 1,980-token searchless_chess action vocabulary (1,968 reachable actions
+ 1 PAD + 11 outcome tokens)
- 512-token context window
- prepend_outcome=False (no outcome conditioning)
- 200K training steps at batch size 256 (best checkpoint at step 195K)
- 34.65M parameters
Published model.safetensors is the best 5K-cadence checkpoint by val
loss (step 195,000). All intermediate 5K checkpoints are preserved under
checkpoints/ for training-dynamics analysis.
The legacy checkpoint is preserved in the git history of this repo and
is also available at thomas-schweich/pawn-base-legacy.
- checkpoints/step_00005000/.complete +9 -0
- checkpoints/step_00005000/config.json +43 -0
- checkpoints/step_00005000/model.safetensors +3 -0
- checkpoints/step_00005000/optimizer.safetensors +3 -0
- checkpoints/step_00005000/training_state.json +118 -0
- checkpoints/step_00010000/.complete +9 -0
- checkpoints/step_00010000/config.json +43 -0
- checkpoints/step_00010000/model.safetensors +3 -0
- checkpoints/step_00010000/optimizer.safetensors +3 -0
- checkpoints/step_00010000/training_state.json +118 -0
- checkpoints/step_00015000/.complete +9 -0
- checkpoints/step_00015000/config.json +43 -0
- checkpoints/step_00015000/model.safetensors +3 -0
- checkpoints/step_00015000/optimizer.safetensors +3 -0
- checkpoints/step_00015000/training_state.json +118 -0
- checkpoints/step_00020000/.complete +9 -0
- checkpoints/step_00020000/config.json +43 -0
- checkpoints/step_00020000/model.safetensors +3 -0
- checkpoints/step_00020000/optimizer.safetensors +3 -0
- checkpoints/step_00020000/training_state.json +118 -0
- checkpoints/step_00025000/.complete +9 -0
- checkpoints/step_00025000/config.json +43 -0
- checkpoints/step_00025000/model.safetensors +3 -0
- checkpoints/step_00025000/optimizer.safetensors +3 -0
- checkpoints/step_00025000/training_state.json +118 -0
- checkpoints/step_00030000/.complete +9 -0
- checkpoints/step_00030000/config.json +43 -0
- checkpoints/step_00030000/model.safetensors +3 -0
- checkpoints/step_00030000/optimizer.safetensors +3 -0
- checkpoints/step_00030000/training_state.json +118 -0
- checkpoints/step_00035000/.complete +9 -0
- checkpoints/step_00035000/config.json +43 -0
- checkpoints/step_00035000/model.safetensors +3 -0
- checkpoints/step_00035000/optimizer.safetensors +3 -0
- checkpoints/step_00035000/training_state.json +118 -0
- checkpoints/step_00040000/.complete +9 -0
- checkpoints/step_00040000/config.json +43 -0
- checkpoints/step_00040000/model.safetensors +3 -0
- checkpoints/step_00040000/optimizer.safetensors +3 -0
- checkpoints/step_00040000/training_state.json +118 -0
- checkpoints/step_00045000/.complete +9 -0
- checkpoints/step_00045000/config.json +43 -0
- checkpoints/step_00045000/model.safetensors +3 -0
- checkpoints/step_00045000/optimizer.safetensors +3 -0
- checkpoints/step_00045000/training_state.json +118 -0
- checkpoints/step_00050000/.complete +9 -0
- checkpoints/step_00050000/config.json +43 -0
- checkpoints/step_00050000/model.safetensors +3 -0
- checkpoints/step_00050000/optimizer.safetensors +3 -0
- checkpoints/step_00050000/training_state.json +118 -0
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "46cdf2672363f6db6e2dff794dc7b453ce4e3ed72668f73fb5970bfedc6a844b",
|
| 6 |
+
"optimizer.safetensors": "69da912f8a65bb55d73b70cb1a07d24749b76808930d61ceba493d504959f1a2",
|
| 7 |
+
"training_state.json": "d848511b44cf0079a7afc137e997678d99e345b4cbc3ee8789e26c0412962760"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46cdf2672363f6db6e2dff794dc7b453ce4e3ed72668f73fb5970bfedc6a844b
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69da912f8a65bb55d73b70cb1a07d24749b76808930d61ceba493d504959f1a2
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 5000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 5000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 262144.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 1000
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.00015,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "57df026b62563f00a4e03423f95ea04fa5701a8538f1e76c51508dfd550f64a7",
|
| 6 |
+
"optimizer.safetensors": "be8f77774c4ccd78dff442f97899e5c92d45e21bc8ff71eea576e5b5547352e9",
|
| 7 |
+
"training_state.json": "80b91a2142500ba9dff4cb75e047b62b9ac7d6e676ce599693af213e9ae1e96c"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57df026b62563f00a4e03423f95ea04fa5701a8538f1e76c51508dfd550f64a7
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be8f77774c4ccd78dff442f97899e5c92d45e21bc8ff71eea576e5b5547352e9
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 10000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 10000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 524288.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 1852
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.0003,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "8a596bd1484b63eef2080cafb8a4b4130db4869c302f7192c0f5cd8ad69c586a",
|
| 6 |
+
"optimizer.safetensors": "0dbb9629499db58f9fb2b8ef82e4b24d9d861f71f6fbffbcfd19842acb8515a1",
|
| 7 |
+
"training_state.json": "985a68e3a2d1b9eab3c420cc4187c65d1a632e9c621eaa077bd7e7ade0240a1e"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a596bd1484b63eef2080cafb8a4b4130db4869c302f7192c0f5cd8ad69c586a
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0dbb9629499db58f9fb2b8ef82e4b24d9d861f71f6fbffbcfd19842acb8515a1
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 15000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 15000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 1048576.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 704
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.0002995389065559004,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "63c8de714528a31192fe48e0464656eba0f5e3a0fb087e42f67a66a3e629a810",
|
| 6 |
+
"optimizer.safetensors": "b3623f7342dbafaf20604f3d21a89a4957a438838616e62f03f548e5c00fd0cd",
|
| 7 |
+
"training_state.json": "17c547ce4a162cdaf82cf1d89ec6ee7002e4ed8094acfcc15490a1794970a3b2"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:63c8de714528a31192fe48e0464656eba0f5e3a0fb087e42f67a66a3e629a810
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3623f7342dbafaf20604f3d21a89a4957a438838616e62f03f548e5c00fd0cd
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 20000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 20000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 524288.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 370
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.0002981587759593675,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "79b501cee21d7a9f36195c9d8cb5f408470e7b1f4e33f05c5d79b3b892a5c588",
|
| 6 |
+
"optimizer.safetensors": "0d3a6f6cfe0ef2a5d08bad2eabd6ea1b45df2e41c049fd2f36488c3931268ff0",
|
| 7 |
+
"training_state.json": "c44769a606d9f82a04b0ef12c344c9070454d9d400073a399665503933edf5b4"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79b501cee21d7a9f36195c9d8cb5f408470e7b1f4e33f05c5d79b3b892a5c588
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d3a6f6cfe0ef2a5d08bad2eabd6ea1b45df2e41c049fd2f36488c3931268ff0
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 25000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 25000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 262144.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 492
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.00029586903590180956,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "b70b6d6386dfa9f89737337ee1fbb6a0b892cf92cfb452027143fb916680dde0",
|
| 6 |
+
"optimizer.safetensors": "27f21456f5b6a7a90e08a9ea00cfb6e60135de4bf215f117a7af90a8012d1995",
|
| 7 |
+
"training_state.json": "78064f173c8dcf6a15aa506f2c1fff9b7675b88a202054b0597807c3d9a55637"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b70b6d6386dfa9f89737337ee1fbb6a0b892cf92cfb452027143fb916680dde0
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27f21456f5b6a7a90e08a9ea00cfb6e60135de4bf215f117a7af90a8012d1995
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 30000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 30000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 524288.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 697
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.0002926853276295856,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "cc7acb7a77834621774e0a65745bcd0a9cf0162240acb096efd2e598a9d4d1d2",
|
| 6 |
+
"optimizer.safetensors": "612cad9530ec79af4dae69f0b1e2ecd777bdcb43b469fe0a4388ca9050463ddb",
|
| 7 |
+
"training_state.json": "f9974867887971db55b77cb9496a968599ea6e4a4a0e71bfe58da741e06e68d0"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc7acb7a77834621774e0a65745bcd0a9cf0162240acb096efd2e598a9d4d1d2
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:612cad9530ec79af4dae69f0b1e2ecd777bdcb43b469fe0a4388ca9050463ddb
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 35000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 35000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 131072.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 1756
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.00028862939909843273,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "fe98152386859314cd81661d3d7a6ee2e567571c4acab064ae921eca9f1fc9d5",
|
| 6 |
+
"optimizer.safetensors": "19d8e2a91d9f8e1aafb2102af702a4b183ebad983c02e088d012a194545d24c9",
|
| 7 |
+
"training_state.json": "689ffcfe1380b3b7654dcc2c3c5e8817064358d613965ec381ec139773c17bc5"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe98152386859314cd81661d3d7a6ee2e567571c4acab064ae921eca9f1fc9d5
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19d8e2a91d9f8e1aafb2102af702a4b183ebad983c02e088d012a194545d24c9
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 40000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 40000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 131072.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 862
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.000283728956412876,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "54ce3157e913d205c070d4adab9c609f1694abfb8ccfaa49d6a401026c63a2b3",
|
| 6 |
+
"optimizer.safetensors": "71d9cb483d91cd1687474153bb0684f40a712d517e4fe03a80713adcf0245d63",
|
| 7 |
+
"training_state.json": "ca4991b2296afff8e99fc36950975f1fc93cccf3d9418946168f840b9da1e01e"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54ce3157e913d205c070d4adab9c609f1694abfb8ccfaa49d6a401026c63a2b3
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71d9cb483d91cd1687474153bb0684f40a712d517e4fe03a80713adcf0245d63
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 45000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 45000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 262144.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 1518
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.00027801747456544134,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"files": {
|
| 4 |
+
"config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
|
| 5 |
+
"model.safetensors": "256f468f937ce337cc2d36788d20ccf95ea7cf3d7bdea251d00f60ee0ccb5298",
|
| 6 |
+
"optimizer.safetensors": "5d3d1e3e0ecbb83d069d0b3b2835e4dd86109f864c6dcfc2d00b07b82ad57c08",
|
| 7 |
+
"training_state.json": "f88bbaa054f989ba0228a1ce8e17f7fd7b66ec1cff2db8d56e14edc583c1f528"
|
| 8 |
+
}
|
| 9 |
+
}
|
|
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"checkpoint_type": "pretrain",
|
| 4 |
+
"model_config": {
|
| 5 |
+
"vocab_size": 1980,
|
| 6 |
+
"max_seq_len": 512,
|
| 7 |
+
"n_outcomes": 11,
|
| 8 |
+
"d_model": 512,
|
| 9 |
+
"n_layers": 8,
|
| 10 |
+
"n_heads": 8,
|
| 11 |
+
"d_ff": 2048,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"rope_base": 10000.0
|
| 14 |
+
},
|
| 15 |
+
"training_config": {
|
| 16 |
+
"lr": 0.0003,
|
| 17 |
+
"weight_decay": 0.01,
|
| 18 |
+
"max_grad_norm": 1.0,
|
| 19 |
+
"warmup_steps": 10000,
|
| 20 |
+
"total_steps": 200000,
|
| 21 |
+
"batch_size": 256,
|
| 22 |
+
"max_ply": 512,
|
| 23 |
+
"discard_ply_limit": false,
|
| 24 |
+
"num_workers": 4,
|
| 25 |
+
"use_amp": true,
|
| 26 |
+
"accumulation_steps": 1,
|
| 27 |
+
"log_interval": 50,
|
| 28 |
+
"eval_interval": 1000,
|
| 29 |
+
"checkpoint_interval": 5000,
|
| 30 |
+
"pause_after_steps": null,
|
| 31 |
+
"no_outcome_token": false,
|
| 32 |
+
"prepend_outcome": false,
|
| 33 |
+
"mate_boost": 0.0,
|
| 34 |
+
"base_seed": 42,
|
| 35 |
+
"val_seed": 9223372036854775807,
|
| 36 |
+
"val_games": 2048,
|
| 37 |
+
"checkpoint_dir": "checkpoints",
|
| 38 |
+
"log_dir": "/workspace/logs",
|
| 39 |
+
"use_wandb": false,
|
| 40 |
+
"wandb_project": "pawn",
|
| 41 |
+
"device": "cuda"
|
| 42 |
+
}
|
| 43 |
+
}
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:256f468f937ce337cc2d36788d20ccf95ea7cf3d7bdea251d00f60ee0ccb5298
|
| 3 |
+
size 138612064
|
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d3d1e3e0ecbb83d069d0b3b2835e4dd86109f864c6dcfc2d00b07b82ad57c08
|
| 3 |
+
size 277229900
|
|
@@ -0,0 +1,118 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"format_version": 1,
|
| 3 |
+
"global_step": 50000,
|
| 4 |
+
"scheduler_state_dict": {
|
| 5 |
+
"step": 50000
|
| 6 |
+
},
|
| 7 |
+
"scaler_state_dict": {
|
| 8 |
+
"scale": 524288.0,
|
| 9 |
+
"growth_factor": 2.0,
|
| 10 |
+
"backoff_factor": 0.5,
|
| 11 |
+
"growth_interval": 2000,
|
| 12 |
+
"_growth_tracker": 624
|
| 13 |
+
},
|
| 14 |
+
"optimizer_meta": {
|
| 15 |
+
"param_groups": [
|
| 16 |
+
{
|
| 17 |
+
"lr": 0.0002715339687685131,
|
| 18 |
+
"betas": [
|
| 19 |
+
0.9,
|
| 20 |
+
0.999
|
| 21 |
+
],
|
| 22 |
+
"eps": 1e-08,
|
| 23 |
+
"weight_decay": 0.01,
|
| 24 |
+
"amsgrad": false,
|
| 25 |
+
"maximize": false,
|
| 26 |
+
"foreach": null,
|
| 27 |
+
"capturable": false,
|
| 28 |
+
"differentiable": false,
|
| 29 |
+
"fused": null,
|
| 30 |
+
"decoupled_weight_decay": true,
|
| 31 |
+
"params": [
|
| 32 |
+
0,
|
| 33 |
+
1,
|
| 34 |
+
2,
|
| 35 |
+
3,
|
| 36 |
+
4,
|
| 37 |
+
5,
|
| 38 |
+
6,
|
| 39 |
+
7,
|
| 40 |
+
8,
|
| 41 |
+
9,
|
| 42 |
+
10,
|
| 43 |
+
11,
|
| 44 |
+
12,
|
| 45 |
+
13,
|
| 46 |
+
14,
|
| 47 |
+
15,
|
| 48 |
+
16,
|
| 49 |
+
17,
|
| 50 |
+
18,
|
| 51 |
+
19,
|
| 52 |
+
20,
|
| 53 |
+
21,
|
| 54 |
+
22,
|
| 55 |
+
23,
|
| 56 |
+
24,
|
| 57 |
+
25,
|
| 58 |
+
26,
|
| 59 |
+
27,
|
| 60 |
+
28,
|
| 61 |
+
29,
|
| 62 |
+
30,
|
| 63 |
+
31,
|
| 64 |
+
32,
|
| 65 |
+
33,
|
| 66 |
+
34,
|
| 67 |
+
35,
|
| 68 |
+
36,
|
| 69 |
+
37,
|
| 70 |
+
38,
|
| 71 |
+
39,
|
| 72 |
+
40,
|
| 73 |
+
41,
|
| 74 |
+
42,
|
| 75 |
+
43,
|
| 76 |
+
44,
|
| 77 |
+
45,
|
| 78 |
+
46,
|
| 79 |
+
47,
|
| 80 |
+
48,
|
| 81 |
+
49,
|
| 82 |
+
50,
|
| 83 |
+
51,
|
| 84 |
+
52,
|
| 85 |
+
53,
|
| 86 |
+
54,
|
| 87 |
+
55,
|
| 88 |
+
56,
|
| 89 |
+
57,
|
| 90 |
+
58,
|
| 91 |
+
59,
|
| 92 |
+
60,
|
| 93 |
+
61,
|
| 94 |
+
62,
|
| 95 |
+
63,
|
| 96 |
+
64,
|
| 97 |
+
65,
|
| 98 |
+
66,
|
| 99 |
+
67,
|
| 100 |
+
68,
|
| 101 |
+
69,
|
| 102 |
+
70,
|
| 103 |
+
71,
|
| 104 |
+
72,
|
| 105 |
+
73,
|
| 106 |
+
74,
|
| 107 |
+
75,
|
| 108 |
+
76,
|
| 109 |
+
77,
|
| 110 |
+
78
|
| 111 |
+
]
|
| 112 |
+
}
|
| 113 |
+
],
|
| 114 |
+
"scalars": null
|
| 115 |
+
},
|
| 116 |
+
"torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV94A
AAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAABd
MEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oVYA
AAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
|
| 117 |
+
"cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
|
| 118 |
+
}
|