yczhang committed on
Commit ·
021778d
1
Parent(s): 633ca6d
Update: fix bug
Browse files - tokenization_interns1.py +1 -0
tokenization_interns1.py
CHANGED
|
@@ -450,6 +450,7 @@ class InternS1Tokenizer(PreTrainedTokenizer):
|
|
| 450 |
pad_token="<|endoftext|>",
|
| 451 |
clean_up_tokenization_spaces=False,
|
| 452 |
split_special_tokens=False,
|
|
|
|
| 453 |
**kwargs,
|
| 454 |
):
|
| 455 |
bos_token = (
|
|
|
|
| 450 |
pad_token="<|endoftext|>",
|
| 451 |
clean_up_tokenization_spaces=False,
|
| 452 |
split_special_tokens=False,
|
| 453 |
+
special_tokens_pattern="none",
|
| 454 |
**kwargs,
|
| 455 |
):
|
| 456 |
bos_token = (
|