Chess Challenge submission by MDaytek
Browse files- README.md +2 -2
- config.json +1 -1
- model.safetensors +2 -2
- vocab.json +56 -1
README.md
CHANGED
|
@@ -14,13 +14,13 @@ Chess model submitted to the LLM Course Chess Challenge.
|
|
| 14 |
## Submission Info
|
| 15 |
|
| 16 |
- **Submitted by**: [MDaytek](https://huggingface.co/MDaytek)
|
| 17 |
-
- **Parameters**:
|
| 18 |
- **Organization**: LLM-course
|
| 19 |
|
| 20 |
## Model Details
|
| 21 |
|
| 22 |
- **Architecture**: Chess Transformer (GPT-style)
|
| 23 |
-
- **Vocab size**:
|
| 24 |
- **Embedding dim**: 120
|
| 25 |
- **Layers**: 5
|
| 26 |
- **Heads**: 8
|
|
|
|
| 14 |
## Submission Info
|
| 15 |
|
| 16 |
- **Submitted by**: [MDaytek](https://huggingface.co/MDaytek)
|
| 17 |
+
- **Parameters**: 993,960
|
| 18 |
- **Organization**: LLM-course
|
| 19 |
|
| 20 |
## Model Details
|
| 21 |
|
| 22 |
- **Architecture**: Chess Transformer (GPT-style)
|
| 23 |
+
- **Vocab size**: 380
|
| 24 |
- **Embedding dim**: 120
|
| 25 |
- **Layers**: 5
|
| 26 |
- **Heads**: 8
|
config.json
CHANGED
|
@@ -14,5 +14,5 @@
|
|
| 14 |
"n_layer": 5,
|
| 15 |
"n_positions": 256,
|
| 16 |
"transformers_version": "4.57.6",
|
| 17 |
-
"vocab_size":
|
| 18 |
}
|
|
|
|
| 14 |
"n_layer": 5,
|
| 15 |
"n_positions": 256,
|
| 16 |
"transformers_version": "4.57.6",
|
| 17 |
+
"vocab_size": 380
|
| 18 |
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a3ec4490eebae6357516c18e9e1c382007e962d063524cc531762fedb6bbf39
|
| 3 |
+
size 3981576
|
vocab.json
CHANGED
|
@@ -323,5 +323,60 @@
|
|
| 323 |
"WBb5c6(x+)": 321,
|
| 324 |
"WPc2d3(x)": 322,
|
| 325 |
"WPg4f5(x)": 323,
|
| 326 |
-
"WKg2g3": 324
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 327 |
}
|
|
|
|
| 323 |
"WBb5c6(x+)": 321,
|
| 324 |
"WPc2d3(x)": 322,
|
| 325 |
"WPg4f5(x)": 323,
|
| 326 |
+
"WKg2g3": 324,
|
| 327 |
+
"WKe2d3": 325,
|
| 328 |
+
"WBe3d4(x)": 326,
|
| 329 |
+
"WNe5c6(x)": 327,
|
| 330 |
+
"BKf7g6": 328,
|
| 331 |
+
"BPa7b6(x)": 329,
|
| 332 |
+
"BNe7c6": 330,
|
| 333 |
+
"WNg5f3": 331,
|
| 334 |
+
"WKg2h3": 332,
|
| 335 |
+
"WKf2g3": 333,
|
| 336 |
+
"BPf4f3": 334,
|
| 337 |
+
"WKh2g3": 335,
|
| 338 |
+
"WPh5g6(x)": 336,
|
| 339 |
+
"WBc4d5(x)": 337,
|
| 340 |
+
"WQf3g3": 338,
|
| 341 |
+
"BQd8e7(x)": 339,
|
| 342 |
+
"WRe1f1": 340,
|
| 343 |
+
"WPf2g3(x)": 341,
|
| 344 |
+
"BBg7e5(x)": 342,
|
| 345 |
+
"WNf3h2": 343,
|
| 346 |
+
"WBg5e3": 344,
|
| 347 |
+
"WBf1c4(x)": 345,
|
| 348 |
+
"BKe8f7": 346,
|
| 349 |
+
"WRf1f3": 347,
|
| 350 |
+
"BBd6e7": 348,
|
| 351 |
+
"BKf7e7": 349,
|
| 352 |
+
"WBf4e5(x)": 350,
|
| 353 |
+
"WNe4f6(x+)": 351,
|
| 354 |
+
"WKe1d1": 352,
|
| 355 |
+
"WBd2c3": 353,
|
| 356 |
+
"WPg3f4(x)": 354,
|
| 357 |
+
"BQd8e8": 355,
|
| 358 |
+
"WQd1e1": 356,
|
| 359 |
+
"BPa3a2": 357,
|
| 360 |
+
"WRd1c1": 358,
|
| 361 |
+
"BKh7g8": 359,
|
| 362 |
+
"WKh2g1": 360,
|
| 363 |
+
"BPg4g3": 361,
|
| 364 |
+
"WKc1d2": 362,
|
| 365 |
+
"BNd5c3(x)": 363,
|
| 366 |
+
"WPa6a7": 364,
|
| 367 |
+
"BKh8h7": 365,
|
| 368 |
+
"BRe8f8": 366,
|
| 369 |
+
"BRd8c8": 367,
|
| 370 |
+
"WPd5e6(x)": 368,
|
| 371 |
+
"WNe5f3": 369,
|
| 372 |
+
"WRh1d1": 370,
|
| 373 |
+
"WQd1d3(x)": 371,
|
| 374 |
+
"BRh8d8": 372,
|
| 375 |
+
"BKf7f6": 373,
|
| 376 |
+
"BKg7g6": 374,
|
| 377 |
+
"WKf2e2": 375,
|
| 378 |
+
"WBe3d2": 376,
|
| 379 |
+
"WBc4e6(x)": 377,
|
| 380 |
+
"BRc8d8": 378,
|
| 381 |
+
"BKe8f7(x)": 379
|
| 382 |
}
|