Update tokenizer.py
Files changed: tokenizer.py (+3 -0)
tokenizer.py
CHANGED
|
@@ -91,6 +91,9 @@ class MedTok(PreTrainedTokenizer):
|
|
| 91 |
"vocab_file": "vocab.json",
|
| 92 |
"code2tokens_file": "code2tokens.json",
|
| 93 |
"code2embedding_file": "code2embeddings.json",
|
|
|
|
|
|
|
|
|
|
| 94 |
}
|
| 95 |
with open(os.path.join(save_directory, "tokenizer_config.json"), "w") as f:
|
| 96 |
json.dump(tokenizer_config, f, indent=2)
|
|
|
|
| 91 |
"vocab_file": "vocab.json",
|
| 92 |
"code2tokens_file": "code2tokens.json",
|
| 93 |
"code2embedding_file": "code2embeddings.json",
|
| 94 |
+
"auto_map": {
|
| 95 |
+
"AutoTokenizer": "tokenizer.MedTok"
|
| 96 |
+
}
|
| 97 |
}
|
| 98 |
with open(os.path.join(save_directory, "tokenizer_config.json"), "w") as f:
|
| 99 |
json.dump(tokenizer_config, f, indent=2)
|