PyTorch
gpt2
achille-fusco committed on
Commit
2e7d313
·
verified ·
1 Parent(s): af0c2c7

Update tokenizer.py

Browse files
Files changed (1) hide show
  1. tokenizer.py +1 -0
tokenizer.py CHANGED
@@ -251,6 +251,7 @@ class ParadigmTokenizerWrapper(PreTrainedTokenizerFast):
251
  or os.path.dirname(getattr(self, "tokenizer_file", "")) or "."
252
  revision = kwargs.get("revision", None)
253
 
 
254
  ppath = _get_repo_file(repo_id_or_path, "paradigms.json", revision)
255
  self.paradigms, self.paradigms_meta = _load_paradigms_any(ppath)
256
 
 
251
  or os.path.dirname(getattr(self, "tokenizer_file", "")) or "."
252
  revision = kwargs.get("revision", None)
253
 
254
+ cfg = {"lowercase": True, "space_punct": True}
255
  ppath = _get_repo_file(repo_id_or_path, "paradigms.json", revision)
256
  self.paradigms, self.paradigms_meta = _load_paradigms_any(ppath)
257