MDaytek committed on
Commit
c710f68
·
verified ·
1 Parent(s): c84ac8a

Performance update: 5k games

Browse files
Files changed (4) hide show
  1. README.md +4 -2
  2. config.json +5 -5
  3. model.safetensors +2 -2
  4. tokenizer.json +2 -2
README.md CHANGED
@@ -6,5 +6,7 @@ tags:
6
  - chess-challenge
7
  license: mit
8
  ---
9
- # Submission MDaytek
10
- Fixed n_ctx attribute.
 
 
 
6
  - chess-challenge
7
  license: mit
8
  ---
9
+ # Submission MDaytek (Performance V1)
10
+ Trained on 5000 games.
11
+ Context length: 256.
12
+ Embed dim: 384.
config.json CHANGED
@@ -11,12 +11,12 @@
11
  "initializer_range": 0.02,
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
- "n_ctx": 128,
15
- "n_embd": 128,
16
- "n_head": 4,
17
  "n_inner": null,
18
- "n_layer": 4,
19
- "n_positions": 128,
20
  "pad_token_id": 0,
21
  "reorder_and_upcast_attn": false,
22
  "resid_pdrop": 0.1,
 
11
  "initializer_range": 0.02,
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
+ "n_ctx": 256,
15
+ "n_embd": 384,
16
+ "n_head": 6,
17
  "n_inner": null,
18
+ "n_layer": 6,
19
+ "n_positions": 256,
20
  "pad_token_id": 0,
21
  "reorder_and_upcast_attn": false,
22
  "resid_pdrop": 0.1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8aabd1d84cb2bd25ebd97a84a9f874fa92c7becb1d546c3ebedb6883d179cf30
3
- size 5375920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12e3558d5b2629de984d1d1a20d8dda60142e5b2465ff6be9b0c0ba9639e971f
3
+ size 49386864
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 128,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 128
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 256,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 256
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,