yczhang committed on
Commit
021778d
·
1 Parent(s): 633ca6d

Update: fix bug

Browse files
Files changed (1) hide show
  1. tokenization_interns1.py +1 -0
tokenization_interns1.py CHANGED
@@ -450,6 +450,7 @@ class InternS1Tokenizer(PreTrainedTokenizer):
450
  pad_token="<|endoftext|>",
451
  clean_up_tokenization_spaces=False,
452
  split_special_tokens=False,
 
453
  **kwargs,
454
  ):
455
  bos_token = (
 
450
  pad_token="<|endoftext|>",
451
  clean_up_tokenization_spaces=False,
452
  split_special_tokens=False,
453
+ special_tokens_pattern="none",
454
  **kwargs,
455
  ):
456
  bos_token = (