Chess Challenge submission by gbl1357

Files changed (6) hide show

README.md ADDED Viewed

+---
+library_name: transformers
+tags:
+- chess
+- llm-course
+- chess-challenge
+license: mit
+---
+# gbl_chess_3
+Chess model submitted to the LLM Course Chess Challenge.
+## Submission Info
+- **Submitted by**: [gbl1357](https://huggingface.co/gbl1357)
+- **Parameters**: 999,024 (counted with `tie_weights: true` in `config.json`)
+- **Organization**: LLM-course
+## Model Details
+- **Architecture**: Chess Transformer (GPT-style)
+- **Vocab size**: 84
+- **Context length**: 256
+- **Embedding dim**: 128
+- **Feed-forward dim**: 360
+- **Layers**: 6
+- **Heads**: 4

config.json ADDED Viewed

+{
+  "architectures": [
+    "ChessForCausalLM"
+  ],
+  "auto_map": {
+    "AutoConfig": "model.ChessConfig",
+    "AutoModelForCausalLM": "model.ChessForCausalLM"
+  },
+  "bos_token_id": 1,
+  "dropout": 0.1,
+  "dtype": "float32",
+  "eos_token_id": 2,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "chess_transformer",
+  "n_ctx": 256,
+  "n_embd": 128,
+  "n_head": 4,
+  "n_inner": 360,
+  "n_layer": 6,
+  "pad_token_id": 0,
+  "tie_weights": true,
+  "transformers_version": "4.57.5",
+  "vocab_size": 84
+}

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6bf6f004d0a03e98d7649ceda872842d4f96fbd429fa47b01857e92c3cad18b9
+size 4002544

special_tokens_map.json ADDED Viewed

+{
+  "bos_token": "[BOS]",
+  "eos_token": "[EOS]",
+  "pad_token": "[PAD]",
+  "unk_token": "[UNK]"
+}

tokenizer_config.json ADDED Viewed

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[BOS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "[EOS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "auto_map": {
+    "AutoTokenizer": [
+      "tokenizer.ChessTokenizer",
+      null
+    ]
+  },
+  "bos_token": "[BOS]",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "[EOS]",
+  "extra_special_tokens": {},
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "[PAD]",
+  "tokenizer_class": "ChessTokenizer",
+  "unk_token": "[UNK]"
+}

vocab.json ADDED Viewed

+{
+  "[PAD]": 0,
+  "[BOS]": 1,
+  "[EOS]": 2,
+  "[UNK]": 3,
+  "SIDE_W": 4,
+  "SIDE_B": 5,
+  "PIECE_P": 6,
+  "PIECE_N": 7,
+  "PIECE_B": 8,
+  "PIECE_R": 9,
+  "PIECE_Q": 10,
+  "PIECE_K": 11,
+  "SQ_a1": 12,
+  "SQ_a2": 13,
+  "SQ_a3": 14,
+  "SQ_a4": 15,
+  "SQ_a5": 16,
+  "SQ_a6": 17,
+  "SQ_a7": 18,
+  "SQ_a8": 19,
+  "SQ_b1": 20,
+  "SQ_b2": 21,
+  "SQ_b3": 22,
+  "SQ_b4": 23,
+  "SQ_b5": 24,
+  "SQ_b6": 25,
+  "SQ_b7": 26,
+  "SQ_b8": 27,
+  "SQ_c1": 28,
+  "SQ_c2": 29,
+  "SQ_c3": 30,
+  "SQ_c4": 31,
+  "SQ_c5": 32,
+  "SQ_c6": 33,
+  "SQ_c7": 34,
+  "SQ_c8": 35,
+  "SQ_d1": 36,
+  "SQ_d2": 37,
+  "SQ_d3": 38,
+  "SQ_d4": 39,
+  "SQ_d5": 40,
+  "SQ_d6": 41,
+  "SQ_d7": 42,
+  "SQ_d8": 43,
+  "SQ_e1": 44,
+  "SQ_e2": 45,
+  "SQ_e3": 46,
+  "SQ_e4": 47,
+  "SQ_e5": 48,
+  "SQ_e6": 49,
+  "SQ_e7": 50,
+  "SQ_e8": 51,
+  "SQ_f1": 52,
+  "SQ_f2": 53,
+  "SQ_f3": 54,
+  "SQ_f4": 55,
+  "SQ_f5": 56,
+  "SQ_f6": 57,
+  "SQ_f7": 58,
+  "SQ_f8": 59,
+  "SQ_g1": 60,
+  "SQ_g2": 61,
+  "SQ_g3": 62,
+  "SQ_g4": 63,
+  "SQ_g5": 64,
+  "SQ_g6": 65,
+  "SQ_g7": 66,
+  "SQ_g8": 67,
+  "SQ_h1": 68,
+  "SQ_h2": 69,
+  "SQ_h3": 70,
+  "SQ_h4": 71,
+  "SQ_h5": 72,
+  "SQ_h6": 73,
+  "SQ_h7": 74,
+  "SQ_h8": 75,
+  "PROMO_Q": 76,
+  "PROMO_R": 77,
+  "PROMO_B": 78,
+  "PROMO_N": 79,
+  "CAPTURE": 80,
+  "CHECK": 81,
+  "MATE": 82,
+  "CASTLE": 83
+}