Update tokenizer.py
Browse files
- tokenizer.py +1 -0
tokenizer.py
CHANGED
|
@@ -251,6 +251,7 @@ class ParadigmTokenizerWrapper(PreTrainedTokenizerFast):
|
|
| 251 |
or os.path.dirname(getattr(self, "tokenizer_file", "")) or "."
|
| 252 |
revision = kwargs.get("revision", None)
|
| 253 |
|
|
|
|
| 254 |
ppath = _get_repo_file(repo_id_or_path, "paradigms.json", revision)
|
| 255 |
self.paradigms, self.paradigms_meta = _load_paradigms_any(ppath)
|
| 256 |
|
|
|
|
| 251 |
or os.path.dirname(getattr(self, "tokenizer_file", "")) or "."
|
| 252 |
revision = kwargs.get("revision", None)
|
| 253 |
|
| 254 |
+
cfg = {"lowercase": True, "space_punct": True}
|
| 255 |
ppath = _get_repo_file(repo_id_or_path, "paradigms.json", revision)
|
| 256 |
self.paradigms, self.paradigms_meta = _load_paradigms_any(ppath)
|
| 257 |
|