thomas-schweich committed on
Commit
91994e5
·
1 Parent(s): 818e5c9

v1.0.0: searchless_chess vocab, 512 context, 200K steps

Browse files

Squash-merge of run/co_pretraining_2026_04_13 into main.

Replaces the legacy backbone (4,278-token coordinate vocab, 256 context,
prepend_outcome=True, 100K steps) with the v1.0.0 backbone:

- 1,980-token searchless_chess action vocabulary (1,968 reachable actions
+ 1 PAD + 11 outcome tokens)
- 512-token context window
- prepend_outcome=False (no outcome conditioning)
- 200K training steps at batch size 256 (best checkpoint at step 195K)
- 34.65M parameters

The published model.safetensors is the checkpoint with the lowest validation
loss among those saved at the 5K-step cadence (step 195,000). All intermediate
5K-step checkpoints are preserved under checkpoints/ for training-dynamics analysis.

The legacy checkpoint is preserved in the git history of this repo and
is also available at thomas-schweich/pawn-base-legacy.

This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoints/step_00005000/.complete +9 -0
  2. checkpoints/step_00005000/config.json +43 -0
  3. checkpoints/step_00005000/model.safetensors +3 -0
  4. checkpoints/step_00005000/optimizer.safetensors +3 -0
  5. checkpoints/step_00005000/training_state.json +118 -0
  6. checkpoints/step_00010000/.complete +9 -0
  7. checkpoints/step_00010000/config.json +43 -0
  8. checkpoints/step_00010000/model.safetensors +3 -0
  9. checkpoints/step_00010000/optimizer.safetensors +3 -0
  10. checkpoints/step_00010000/training_state.json +118 -0
  11. checkpoints/step_00015000/.complete +9 -0
  12. checkpoints/step_00015000/config.json +43 -0
  13. checkpoints/step_00015000/model.safetensors +3 -0
  14. checkpoints/step_00015000/optimizer.safetensors +3 -0
  15. checkpoints/step_00015000/training_state.json +118 -0
  16. checkpoints/step_00020000/.complete +9 -0
  17. checkpoints/step_00020000/config.json +43 -0
  18. checkpoints/step_00020000/model.safetensors +3 -0
  19. checkpoints/step_00020000/optimizer.safetensors +3 -0
  20. checkpoints/step_00020000/training_state.json +118 -0
  21. checkpoints/step_00025000/.complete +9 -0
  22. checkpoints/step_00025000/config.json +43 -0
  23. checkpoints/step_00025000/model.safetensors +3 -0
  24. checkpoints/step_00025000/optimizer.safetensors +3 -0
  25. checkpoints/step_00025000/training_state.json +118 -0
  26. checkpoints/step_00030000/.complete +9 -0
  27. checkpoints/step_00030000/config.json +43 -0
  28. checkpoints/step_00030000/model.safetensors +3 -0
  29. checkpoints/step_00030000/optimizer.safetensors +3 -0
  30. checkpoints/step_00030000/training_state.json +118 -0
  31. checkpoints/step_00035000/.complete +9 -0
  32. checkpoints/step_00035000/config.json +43 -0
  33. checkpoints/step_00035000/model.safetensors +3 -0
  34. checkpoints/step_00035000/optimizer.safetensors +3 -0
  35. checkpoints/step_00035000/training_state.json +118 -0
  36. checkpoints/step_00040000/.complete +9 -0
  37. checkpoints/step_00040000/config.json +43 -0
  38. checkpoints/step_00040000/model.safetensors +3 -0
  39. checkpoints/step_00040000/optimizer.safetensors +3 -0
  40. checkpoints/step_00040000/training_state.json +118 -0
  41. checkpoints/step_00045000/.complete +9 -0
  42. checkpoints/step_00045000/config.json +43 -0
  43. checkpoints/step_00045000/model.safetensors +3 -0
  44. checkpoints/step_00045000/optimizer.safetensors +3 -0
  45. checkpoints/step_00045000/training_state.json +118 -0
  46. checkpoints/step_00050000/.complete +9 -0
  47. checkpoints/step_00050000/config.json +43 -0
  48. checkpoints/step_00050000/model.safetensors +3 -0
  49. checkpoints/step_00050000/optimizer.safetensors +3 -0
  50. checkpoints/step_00050000/training_state.json +118 -0
checkpoints/step_00005000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "46cdf2672363f6db6e2dff794dc7b453ce4e3ed72668f73fb5970bfedc6a844b",
6
+ "optimizer.safetensors": "69da912f8a65bb55d73b70cb1a07d24749b76808930d61ceba493d504959f1a2",
7
+ "training_state.json": "d848511b44cf0079a7afc137e997678d99e345b4cbc3ee8789e26c0412962760"
8
+ }
9
+ }
checkpoints/step_00005000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00005000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46cdf2672363f6db6e2dff794dc7b453ce4e3ed72668f73fb5970bfedc6a844b
3
+ size 138612064
checkpoints/step_00005000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69da912f8a65bb55d73b70cb1a07d24749b76808930d61ceba493d504959f1a2
3
+ size 277229900
checkpoints/step_00005000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 5000,
4
+ "scheduler_state_dict": {
5
+ "step": 5000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 262144.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 1000
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.00015,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00010000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "57df026b62563f00a4e03423f95ea04fa5701a8538f1e76c51508dfd550f64a7",
6
+ "optimizer.safetensors": "be8f77774c4ccd78dff442f97899e5c92d45e21bc8ff71eea576e5b5547352e9",
7
+ "training_state.json": "80b91a2142500ba9dff4cb75e047b62b9ac7d6e676ce599693af213e9ae1e96c"
8
+ }
9
+ }
checkpoints/step_00010000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00010000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57df026b62563f00a4e03423f95ea04fa5701a8538f1e76c51508dfd550f64a7
3
+ size 138612064
checkpoints/step_00010000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be8f77774c4ccd78dff442f97899e5c92d45e21bc8ff71eea576e5b5547352e9
3
+ size 277229900
checkpoints/step_00010000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 10000,
4
+ "scheduler_state_dict": {
5
+ "step": 10000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 524288.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 1852
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.0003,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00015000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "8a596bd1484b63eef2080cafb8a4b4130db4869c302f7192c0f5cd8ad69c586a",
6
+ "optimizer.safetensors": "0dbb9629499db58f9fb2b8ef82e4b24d9d861f71f6fbffbcfd19842acb8515a1",
7
+ "training_state.json": "985a68e3a2d1b9eab3c420cc4187c65d1a632e9c621eaa077bd7e7ade0240a1e"
8
+ }
9
+ }
checkpoints/step_00015000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00015000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a596bd1484b63eef2080cafb8a4b4130db4869c302f7192c0f5cd8ad69c586a
3
+ size 138612064
checkpoints/step_00015000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dbb9629499db58f9fb2b8ef82e4b24d9d861f71f6fbffbcfd19842acb8515a1
3
+ size 277229900
checkpoints/step_00015000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 15000,
4
+ "scheduler_state_dict": {
5
+ "step": 15000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 1048576.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 704
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.0002995389065559004,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00020000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "63c8de714528a31192fe48e0464656eba0f5e3a0fb087e42f67a66a3e629a810",
6
+ "optimizer.safetensors": "b3623f7342dbafaf20604f3d21a89a4957a438838616e62f03f548e5c00fd0cd",
7
+ "training_state.json": "17c547ce4a162cdaf82cf1d89ec6ee7002e4ed8094acfcc15490a1794970a3b2"
8
+ }
9
+ }
checkpoints/step_00020000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00020000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63c8de714528a31192fe48e0464656eba0f5e3a0fb087e42f67a66a3e629a810
3
+ size 138612064
checkpoints/step_00020000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3623f7342dbafaf20604f3d21a89a4957a438838616e62f03f548e5c00fd0cd
3
+ size 277229900
checkpoints/step_00020000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 20000,
4
+ "scheduler_state_dict": {
5
+ "step": 20000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 524288.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 370
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.0002981587759593675,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00025000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "79b501cee21d7a9f36195c9d8cb5f408470e7b1f4e33f05c5d79b3b892a5c588",
6
+ "optimizer.safetensors": "0d3a6f6cfe0ef2a5d08bad2eabd6ea1b45df2e41c049fd2f36488c3931268ff0",
7
+ "training_state.json": "c44769a606d9f82a04b0ef12c344c9070454d9d400073a399665503933edf5b4"
8
+ }
9
+ }
checkpoints/step_00025000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00025000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79b501cee21d7a9f36195c9d8cb5f408470e7b1f4e33f05c5d79b3b892a5c588
3
+ size 138612064
checkpoints/step_00025000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d3a6f6cfe0ef2a5d08bad2eabd6ea1b45df2e41c049fd2f36488c3931268ff0
3
+ size 277229900
checkpoints/step_00025000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 25000,
4
+ "scheduler_state_dict": {
5
+ "step": 25000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 262144.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 492
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.00029586903590180956,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00030000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "b70b6d6386dfa9f89737337ee1fbb6a0b892cf92cfb452027143fb916680dde0",
6
+ "optimizer.safetensors": "27f21456f5b6a7a90e08a9ea00cfb6e60135de4bf215f117a7af90a8012d1995",
7
+ "training_state.json": "78064f173c8dcf6a15aa506f2c1fff9b7675b88a202054b0597807c3d9a55637"
8
+ }
9
+ }
checkpoints/step_00030000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00030000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b70b6d6386dfa9f89737337ee1fbb6a0b892cf92cfb452027143fb916680dde0
3
+ size 138612064
checkpoints/step_00030000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27f21456f5b6a7a90e08a9ea00cfb6e60135de4bf215f117a7af90a8012d1995
3
+ size 277229900
checkpoints/step_00030000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 30000,
4
+ "scheduler_state_dict": {
5
+ "step": 30000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 524288.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 697
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.0002926853276295856,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00035000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "cc7acb7a77834621774e0a65745bcd0a9cf0162240acb096efd2e598a9d4d1d2",
6
+ "optimizer.safetensors": "612cad9530ec79af4dae69f0b1e2ecd777bdcb43b469fe0a4388ca9050463ddb",
7
+ "training_state.json": "f9974867887971db55b77cb9496a968599ea6e4a4a0e71bfe58da741e06e68d0"
8
+ }
9
+ }
checkpoints/step_00035000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00035000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc7acb7a77834621774e0a65745bcd0a9cf0162240acb096efd2e598a9d4d1d2
3
+ size 138612064
checkpoints/step_00035000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:612cad9530ec79af4dae69f0b1e2ecd777bdcb43b469fe0a4388ca9050463ddb
3
+ size 277229900
checkpoints/step_00035000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 35000,
4
+ "scheduler_state_dict": {
5
+ "step": 35000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 131072.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 1756
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.00028862939909843273,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00040000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "fe98152386859314cd81661d3d7a6ee2e567571c4acab064ae921eca9f1fc9d5",
6
+ "optimizer.safetensors": "19d8e2a91d9f8e1aafb2102af702a4b183ebad983c02e088d012a194545d24c9",
7
+ "training_state.json": "689ffcfe1380b3b7654dcc2c3c5e8817064358d613965ec381ec139773c17bc5"
8
+ }
9
+ }
checkpoints/step_00040000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00040000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe98152386859314cd81661d3d7a6ee2e567571c4acab064ae921eca9f1fc9d5
3
+ size 138612064
checkpoints/step_00040000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19d8e2a91d9f8e1aafb2102af702a4b183ebad983c02e088d012a194545d24c9
3
+ size 277229900
checkpoints/step_00040000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 40000,
4
+ "scheduler_state_dict": {
5
+ "step": 40000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 131072.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 862
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.000283728956412876,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00045000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "54ce3157e913d205c070d4adab9c609f1694abfb8ccfaa49d6a401026c63a2b3",
6
+ "optimizer.safetensors": "71d9cb483d91cd1687474153bb0684f40a712d517e4fe03a80713adcf0245d63",
7
+ "training_state.json": "ca4991b2296afff8e99fc36950975f1fc93cccf3d9418946168f840b9da1e01e"
8
+ }
9
+ }
checkpoints/step_00045000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00045000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54ce3157e913d205c070d4adab9c609f1694abfb8ccfaa49d6a401026c63a2b3
3
+ size 138612064
checkpoints/step_00045000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71d9cb483d91cd1687474153bb0684f40a712d517e4fe03a80713adcf0245d63
3
+ size 277229900
checkpoints/step_00045000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 45000,
4
+ "scheduler_state_dict": {
5
+ "step": 45000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 262144.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 1518
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.00027801747456544134,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }
checkpoints/step_00050000/.complete ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "files": {
4
+ "config.json": "4ab163e389461a686fdd4db069900b3bd84ce8ce5340aa165dbc7c09ebea8084",
5
+ "model.safetensors": "256f468f937ce337cc2d36788d20ccf95ea7cf3d7bdea251d00f60ee0ccb5298",
6
+ "optimizer.safetensors": "5d3d1e3e0ecbb83d069d0b3b2835e4dd86109f864c6dcfc2d00b07b82ad57c08",
7
+ "training_state.json": "f88bbaa054f989ba0228a1ce8e17f7fd7b66ec1cff2db8d56e14edc583c1f528"
8
+ }
9
+ }
checkpoints/step_00050000/config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "checkpoint_type": "pretrain",
4
+ "model_config": {
5
+ "vocab_size": 1980,
6
+ "max_seq_len": 512,
7
+ "n_outcomes": 11,
8
+ "d_model": 512,
9
+ "n_layers": 8,
10
+ "n_heads": 8,
11
+ "d_ff": 2048,
12
+ "dropout": 0.0,
13
+ "rope_base": 10000.0
14
+ },
15
+ "training_config": {
16
+ "lr": 0.0003,
17
+ "weight_decay": 0.01,
18
+ "max_grad_norm": 1.0,
19
+ "warmup_steps": 10000,
20
+ "total_steps": 200000,
21
+ "batch_size": 256,
22
+ "max_ply": 512,
23
+ "discard_ply_limit": false,
24
+ "num_workers": 4,
25
+ "use_amp": true,
26
+ "accumulation_steps": 1,
27
+ "log_interval": 50,
28
+ "eval_interval": 1000,
29
+ "checkpoint_interval": 5000,
30
+ "pause_after_steps": null,
31
+ "no_outcome_token": false,
32
+ "prepend_outcome": false,
33
+ "mate_boost": 0.0,
34
+ "base_seed": 42,
35
+ "val_seed": 9223372036854775807,
36
+ "val_games": 2048,
37
+ "checkpoint_dir": "checkpoints",
38
+ "log_dir": "/workspace/logs",
39
+ "use_wandb": false,
40
+ "wandb_project": "pawn",
41
+ "device": "cuda"
42
+ }
43
+ }
checkpoints/step_00050000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:256f468f937ce337cc2d36788d20ccf95ea7cf3d7bdea251d00f60ee0ccb5298
3
+ size 138612064
checkpoints/step_00050000/optimizer.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d3d1e3e0ecbb83d069d0b3b2835e4dd86109f864c6dcfc2d00b07b82ad57c08
3
+ size 277229900
checkpoints/step_00050000/training_state.json ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "global_step": 50000,
4
+ "scheduler_state_dict": {
5
+ "step": 50000
6
+ },
7
+ "scaler_state_dict": {
8
+ "scale": 524288.0,
9
+ "growth_factor": 2.0,
10
+ "backoff_factor": 0.5,
11
+ "growth_interval": 2000,
12
+ "_growth_tracker": 624
13
+ },
14
+ "optimizer_meta": {
15
+ "param_groups": [
16
+ {
17
+ "lr": 0.0002715339687685131,
18
+ "betas": [
19
+ 0.9,
20
+ 0.999
21
+ ],
22
+ "eps": 1e-08,
23
+ "weight_decay": 0.01,
24
+ "amsgrad": false,
25
+ "maximize": false,
26
+ "foreach": null,
27
+ "capturable": false,
28
+ "differentiable": false,
29
+ "fused": null,
30
+ "decoupled_weight_decay": true,
31
+ "params": [
32
+ 0,
33
+ 1,
34
+ 2,
35
+ 3,
36
+ 4,
37
+ 5,
38
+ 6,
39
+ 7,
40
+ 8,
41
+ 9,
42
+ 10,
43
+ 11,
44
+ 12,
45
+ 13,
46
+ 14,
47
+ 15,
48
+ 16,
49
+ 17,
50
+ 18,
51
+ 19,
52
+ 20,
53
+ 21,
54
+ 22,
55
+ 23,
56
+ 24,
57
+ 25,
58
+ 26,
59
+ 27,
60
+ 28,
61
+ 29,
62
+ 30,
63
+ 31,
64
+ 32,
65
+ 33,
66
+ 34,
67
+ 35,
68
+ 36,
69
+ 37,
70
+ 38,
71
+ 39,
72
+ 40,
73
+ 41,
74
+ 42,
75
+ 43,
76
+ 44,
77
+ 45,
78
+ 46,
79
+ 47,
80
+ 48,
81
+ 49,
82
+ 50,
83
+ 51,
84
+ 52,
85
+ 53,
86
+ 54,
87
+ 55,
88
+ 56,
89
+ 57,
90
+ 58,
91
+ 59,
92
+ 60,
93
+ 61,
94
+ 62,
95
+ 63,
96
+ 64,
97
+ 65,
98
+ 66,
99
+ 67,
100
+ 68,
101
+ 69,
102
+ 70,
103
+ 71,
104
+ 72,
105
+ 73,
106
+ 74,
107
+ 75,
108
+ 76,
109
+ 77,
110
+ 78
111
+ ]
112
+ }
113
+ ],
114
+ "scalars": null
115
+ },
116
+ "torch_rng_state": "hljcGxUfSQ+fAQAAAQAAANIAAAAAAAAAzj3uUQAAAAAlDbfbAAAAAODXdhYAAAAAHAdTtgAAAABPp7tMAAAAAASjDTUAAAAA5xmHeQAAAADgrPl2AAAAAGDTO+4AAAAAEV5vpQAAAAAoLmVHAAAAAOM3XOwAAAAArcqH+QAAAADiw0BbAAAAAGj5lM8AAAAAcw+GYgAAAACrLjMSAAAAADGQlT4AAAAAaZpDJQAAAACBzZ+gAAAAAPc+rTkAAAAAFSQBQwAAAADp6uHMAAAAAHNXWQYAAAAA2lY4AwAAAAAXrHbYAAAAAKP1wi0AAAAA4zBXUwAAAAASoagbAAAAAAMltJoAAAAAyJh3RwAAAACMKoqOAAAAAEFk+8UAAAAABdjhIAAAAACeoY6ZAAAAAN6XSAgAAAAA4I5MvgAAAADLcLbFAAAAAJBiDvMAAAAABtjFygAAAAD/E32LAAAAAEgRBGMAAAAA7SItpwAAAAA8l1BPAAAAAIp05iwAAAAAcqnPuQAAAABhWFc4AAAAAN3gcLsAAAAAqRf8NAAAAADfX3chAAAAADop2cYAAAAAXkRDAAAAAAAE9144AAAAAIeDKI4AAAAAy6DHcAAAAABuF9jQAAAAABddICQAAAAAdqW3OgAAAACWziEwAAAAAGmr+FAAAAAAj1XhIAAAAAC/foK4AAAAAAH5SLYAAAAAI6MKfAAAAACLG+U3AAAAADn/ly0AAAAANgH0tAAAAABN+QB2AAAAAAly8WIAAAAA5AHsOQAAAAAhSzuMAAAAAAflo4YAAAAAcREqzgAAAADCEfxMAAAAAH0l6y4AAAAAcGr/nQAAAAAqDd21AAAAAJYzfLEAAAAAI3IK4wAAAAB1YRabAAAAAOhNxmwAAAAA6N/jNwAAAACIiTZQAAAAAJXTfhgAAAAAK1dacAAAAAA3A/CSAAAAAMAY52MAAAAASmYhwAAAAAAhywp5AAAAAJLXrvIAAAAABIg7zAAAAAC/Pf4IAAAAAAt1nVQAAAAAo9VJOAAAAADwcwdYAAAAAEbzUaYAAAAA6XoZHQAAAACTcjjdAAAAANXrCksAAAAA0oqT3gAAAACzxja2AAAAAJ+cHWQAAAAAMTfUOAAAAAAF5ZPAAAAAADzzboQAAAAAhOYUwwAAAAAuufxEAAAAANB6LDwAAAAAw2ouuwAAAABUF4EMAAAAAGKc/FMAAAAAxoYYWwAAAACideOdAAAAAOxJAuQAAAAAiaBQZwAAAAAbUJMKAAAAADOqykYAAAAAFw4BNgAAAABlBOehAAAAAArQmRIAAAAAnrPfGQAAAACN1jNwAAAAAGyEccoAAAAAp7rovAAAAAAGI0Z3AAAAALb8PJwAAAAALIImuQAAAACQJRU8AAAAAG5cKlkAAAAAIG6fBgAAAAACC273AAAAAP7o+5gAAAAAToXBRwAAAADFqYJ8AAAAAFT/jrsAAAAAYrhP0wAAAABN0ONuAAAAACzQYcAAAAAALM4z2gAAAADLKdG9AAAAAFbJbG4AAAAAi2dK3QAAAADKrnC1AAAAAGsTRpAAAAAANSwMvwAAAABStYiWAAAAADUfVekAAAAAbPDIYgAAAACtadvrAAAAAJbEir8AAAAAcRp4fAAAAADiXAigAAAAAOhvPmUAAAAA56FHTwAAAAD404Q8AAAAAG/Gb1AAAAAABzBngAAAAAB53GsnAAAAACNJByYAAAAAJWk6mAAAAAAR0/H8AAAAABk8q/IAAAAATyzT3QAAAABjLsHtAAAAAHg0v5IAAAAA6OFrMgAAAADajHYNAAAAAG4RtjQAAAAAZ+TORAAAAAAnp1qMAAAAACHwtoMAAAAA+ds8hAAAAABKzPteAAAAAN4eczUAAAAAkvDP0wAAAACqFw2IAAAAAHoBh4cAAAAAePOLRAAAAABT8DC/AAAAADVTwpEAAAAAUYiatQAAAACXZrLGAAAAAN+HV9
4AAAAAwxkwXQAAAAABQ1UXAAAAAM8BXBAAAAAARVbEhgAAAABnz0LDAAAAAHTQvKQAAAAA4HY1MQAAAABUAbX5AAAAAJgWAP8AAAAABeXZKAAAAABenJweAAAAAEG+UhoAAAAA5NC0pAAAAACDD2m9AAAAAH08/fgAAAAAQAV27AAAAABy04BGAAAAAO1Isa8AAAAAQwhJCwAAAAAlhx20AAAAAFtpMRUAAAAAOho9HQAAAAAiLbXnAAAAACkQ0dEAAAAAZ4mA4gAAAACylZP9AAAAAObE36gAAAAA0oWi3QAAAABLb+MIAAAAAOxj0fIAAAAAltiwmAAAAAAH3U8bAAAAAGcUCo8AAAAApMjanwAAAADJ4qqNAAAAAGpkiMgAAAAAXCXW+AAAAAD6wxo9AAAAALAyHzEAAAAAl44w/QAAAADHBcyvAAAAAGjeZS4AAAAAlvI2NgAAAABQsOQVAAAAAMn5VB8AAAAA270MUQAAAACwmptEAAAAAI5Il2QAAAAASMbr4gAAAAAnA1HMAAAAAPZJyZwAAAAAM/a23QAAAACZ2LlLAAAAAJm6ic4AAAAALfCgigAAAACcnwxSAAAAAK/X8lsAAAAA3eS8AwAAAABGDHhzAAAAAPXy1CQAAAAAD3+vSwAAAADwF1l7AAAAACjQk50AAAAAZA3zGAAAAACUnvzAAAAAAAdBjNMAAAAATfPJPwAAAABLkJCfAAAAAKtnKQsAAAAA3FdwiAAAAACMII9UAAAAAJOB1P0AAAAAhOeLtQAAAAALcTVxAAAAAA0auq0AAAAAu8nHLwAAAABWNSAVAAAAAPduvpIAAAAAKCzZGQAAAACKQpFkAAAAAP+T+IoAAAAAJqrv3QAAAADyaf/GAAAAADSEtpwAAAAA/nbj+QAAAAA/p4CMAAAAAHMd2ZkAAAAA5OCN/gAAAADLZhkKAAAAAHH9PcQAAAAA7As7sQAAAADp584RAAAAAOFghuoAAAAAYSpZeAAAAABqOyxAAAAAAJb5AZkAAAAAHNhbewAAAACruWdUAAAAAIEE2RAAAAAASCZM9AAAAABH2+4+AAAAAHqg1x4AAAAAmwaCDgAAAABZiDpDAAAAALpp8WkAAAAArSNt2AAAAACAI3NMAAAAAK5sIVkAAAAAvrPq9AAAAACn/ZbJAAAAAE1dcIUAAAAAHJptewAAAAAMpNVdAAAAAJD6r4sAAAAAQ8zgSwAAAAAdMeh2AAAAAOH1IFMAAAAA5s/tgQAAAAA5Hmn4AAAAAD0klXcAAAAACWVZYQAAAADv79iWAAAAAPNqwSgAAAAAykW6vAAAAABd1BdYAAAAAISlGyAAAAAABPGqvwAAAAAzMKygAAAAAP7mIPYAAAAANoxv1gAAAAAQO/EvAAAAALzevV8AAAAAMWauuQAAAAB9lS1nAAAAABLXSnAAAAAACY8rLAAAAABu6imZAAAAAApPPxkAAAAAsZI4fwAAAAC0VCfNAAAAAPMGkaUAAAAAo7i9twAAAABgyShMAAAAAO4ZTm0AAAAAXnq4KQAAAADL712mAAAAAKV48z4AAAAAbD77PgAAAABDgyi1AAAAAF1zypgAAAAADED1NQAAAACdQrKsAAAAAMDyv0sAAAAANJNmVAAAAACQJTCWAAAAAKFhpd8AAAAA5dn+rAAAAADZJnjLAAAAAPsJ4DEAAAAA24AiwwAAAAAavNyuAAAAAJ/90BEAAAAAYcYuYwAAAADqjbAXAAAAAFGRlQYAAAAA3BiyxgAAAAAbacbRAAAAAIct0hIAAAAAdxmaPAAAAAAWsk0aAAAAALkGV08AAAAAPlprVAAAAADgvPghAAAAAMDUJL0AAAAAGkuLWwAAAACBczInAAAAAOvMn9AAAAAArLBMOgAAAABSTKSJAAAAAMhvCI4AAAAAe9BgpQAAAAAmEXUwAAAAAIJdol0AAAAAWbmklAAAAACZLiX1AAAAADCnUEsAAAAAdn4b5QAAAA
BdMEDSAAAAAHiL1TsAAAAAqTnYKQAAAADNLeXxAAAAACoiIRwAAAAAKjX6cQAAAAC50do0AAAAAPf3e8cAAAAAsgk1bgAAAABkW3TRAAAAADRaJYIAAAAAWZdhCQAAAADXiFFwAAAAAPr229wAAAAAMaIXQQAAAABRdq3UAAAAAA754sIAAAAAM0dpbQAAAADzVNFWAAAAABP2M6gAAAAANQUAZwAAAAB/6mUzAAAAABz6VtIAAAAAR82aQgAAAACFyWWoAAAAAEXSQJEAAAAAq1MIyQAAAADmdtDCAAAAAIyfAlMAAAAA1S2biAAAAAD5ht4UAAAAAJ4ITdcAAAAACGZDpAAAAADcT1FtAAAAAFjAPw4AAAAA50Y9RwAAAABxnhZhAAAAAKFjeD0AAAAApIfw+wAAAAB9EQ/HAAAAAGE6DkQAAAAAEX9+IgAAAABGWglfAAAAAGn+J6sAAAAAHlC6gQAAAACJkBE6AAAAAMfj7cMAAAAA+SBbVgAAAABqj5WSAAAAANrwPY4AAAAAg+X9iQAAAACqRLSaAAAAAMmtyHkAAAAAVSX1DQAAAACUE/7bAAAAACvdcOMAAAAAR5cTIQAAAABG6d1bAAAAAH0P85IAAAAAM9OBXgAAAADgEVo3AAAAAL4EtmkAAAAAFu0k3QAAAADUPQN2AAAAAJxxxi0AAAAATgOS1gAAAAAF3krOAAAAAJroewYAAAAAgZ3e0QAAAADyjQwWAAAAAMUurd8AAAAAW2NEZgAAAAAWS3pdAAAAABeXFoIAAAAAfGiTfgAAAABk3nWsAAAAAKhIgLkAAAAAWPFQMgAAAADom33CAAAAACPH41gAAAAAyQp9TgAAAACIP2hdAAAAALAhF/YAAAAATDvpbAAAAAA2FR7bAAAAAPYJcpIAAAAAin3jXgAAAABYltyNAAAAAIpg+ncAAAAA7Va1tQAAAABh4LXsAAAAACrXx+oAAAAA5cCekAAAAACTshg1AAAAAEYaxXAAAAAAA7zFiQAAAADroW2SAAAAAPNdl9wAAAAA5dsX4QAAAAD513YBAAAAAK/w938AAAAATsHv3wAAAADA5xK6AAAAAFxaulgAAAAA8uuuLwAAAAAhyC1jAAAAAB4/5iUAAAAAd860oAAAAAD6dizeAAAAAGbtswYAAAAAgQoojwAAAAAGbUCOAAAAAMs648AAAAAAkfdm2AAAAACNfYnRAAAAAN9oH8cAAAAAvSC+/wAAAADF3yn1AAAAAA1vZPAAAAAAqcLtmAAAAAC7rpqZAAAAAMXEZ4sAAAAARNjWgAAAAABdWyY5AAAAAMEt0jQAAAAAC19z8gAAAAAbqZQPAAAAAK+o9qsAAAAAswuOBgAAAABNAW9GAAAAADt8dF8AAAAAZmMbqgAAAAAPNnCuAAAAAA6DqC0AAAAAhGAFYgAAAAD4nHoyAAAAAIkR+C0AAAAAMLAerQAAAADByP18AAAAAAkH8qEAAAAAHWPWZwAAAAAxMPGHAAAAAELsVw4AAAAAWmd5KwAAAAArsq8/AAAAAJFH0WkAAAAAYTyXywAAAAAjpkmcAAAAAHHaJlQAAAAAr4NHbQAAAAD18ezaAAAAAC5PbzwAAAAAA3gyPQAAAABdThpbAAAAADo+EOgAAAAAIzzALAAAAACmT8oEAAAAAIdvmScAAAAAWi3kQgAAAAA3Y8JQAAAAAKvFxrsAAAAAtjx3AgAAAACxZyDGAAAAAMsolLAAAAAAIGNeQAAAAAA3/8AuAAAAAILty5YAAAAANZSksgAAAAAA1vvJAAAAAJSPF5kAAAAAw57qCQAAAABgpnIHAAAAAPFd/EoAAAAAInH0DgAAAABMy9xzAAAAAOZtFlMAAAAAmldKOQAAAAB5/aofAAAAADAIsywAAAAAnsUS8AAAAAAUuQZGAAAAAAu8oDkAAAAAqvxZgQAAAACSiDrPAAAAAFx5PUQAAAAAqp8DmgAAAACGA3nKAAAAAGV/oV
YAAAAAcljhjAAAAAB8PQ+jAAAAAEV+qF4AAAAANMzXTgAAAAAQZqxfAAAAAN60E00AAAAAOG0aAQAAAACCjtNyAAAAAH1BwuAAAAAABNjhCAAAAACFjlG3AAAAAMasoRoAAAAAkKLWjAAAAAAi2G9hAAAAAOPWDZ8AAAAAtqlkLgAAAABo3ad/AAAAAD64FmsAAAAAvC/PSgAAAAA9Hb+xAAAAAK9MAskAAAAAl+XMQgAAAABx39E0AAAAACbIXnwAAAAAJVZ04QAAAABY6X6gAAAAAK3YOHAAAAAAMzZT8QAAAACTuyyGAAAAAL4ATmEAAAAAxd584AAAAACsP8aBAAAAAGtx69oAAAAA9GzMGQAAAADWDVLzAAAAALh9Dl4AAAAAM0x7cQAAAAAD8hzQAAAAAKRxgnsAAAAAYNAHkgAAAAASg9DNAAAAAFVlqe0AAAAAxNytYgAAAADgp8pcAAAAAPJV590AAAAAI08FAAAAAADuVLlZAAAAAAZVpJUAAAAAUeHEowAAAACTWRPMAAAAAIzCkycAAAAANuimLAAAAABrR25WAAAAAAypjtkAAAAA99Xa0QAAAADT7D44AAAAABqQvrcAAAAAlpMhbgAAAAAJeSMxAAAAAHekH1oAAAAAlRRHCgAAAAAjWM/eAAAAAJchAdsAAAAA505bTAAAAABFJtFuAAAAAExN/+EAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA==",
117
+ "cuda_rng_state": "kRard2YmFAAAAAAAAAAAAA=="
118
+ }