LLM-course
/

chess-hamonk-v12

Text Generation

chess_transformer

chess-challenge

Model card Files Files and versions

Kevin Hamon committed on Jan 19

Commit

1b49565

·

1 Parent(s): 6146bce

remove custom from_pretrained

Files changed (1) hide show

tokenizer.py +0 -29

tokenizer.py CHANGED Viewed

@@ -364,35 +364,6 @@ class ChessTokenizer(PreTrainedTokenizer):
                 # Non-fatal; we still saved vocab and config
                 pass
-    @classmethod
-    def from_pretrained(cls, load_directory: str) -> "ChessTokenizer":
-        """Load tokenizer from a directory previously written with `save_pretrained`.
-        This primarily reads the vocab file and constructs the tokenizer.
-        If a `tokenizer_config.json` exists it will be consulted for the
-        vocab filename and special tokens (but we still instantiate using
-        the provided class).
-        """
-        config_path = os.path.join(load_directory, "tokenizer_config.json")
-        vocab_file = None
-        if os.path.exists(config_path):
-            try:
-                with open(config_path, "r", encoding="utf-8") as f:
-                    cfg = json.load(f)
-                vocab_file = os.path.join(load_directory, cfg.get("vocab_file", "vocab.json"))
-            except Exception:
-                pass
-        if vocab_file is None:
-            # Fallback: look for a vocab file in the directory
-            candidates = [p for p in os.listdir(load_directory) if p.endswith("vocab.json")]
-            if candidates:
-                vocab_file = os.path.join(load_directory, candidates[0])
-        if vocab_file is None or not os.path.exists(vocab_file):
-            raise FileNotFoundError(f"No vocab file found in {load_directory}")
-        return cls(vocab_file=vocab_file)
 def count_vocab_from_dataset(
     dataset_name: str = "dlouapre/lichess_2025-01_1M",

                 # Non-fatal; we still saved vocab and config
                 pass
 def count_vocab_from_dataset(
     dataset_name: str = "dlouapre/lichess_2025-01_1M",