distinct
Browse files- tokenizer_13a.py +1 -3
tokenizer_13a.py
CHANGED
|
@@ -67,8 +67,7 @@ class TokenizerRegexp(BaseTokenizer):
|
|
| 67 |
# no leading or trailing spaces, single space within words
|
| 68 |
# return ' '.join(line.split())
|
| 69 |
# This line is changed with regards to the original tokenizer (seen above) to return individual words
|
| 70 |
-
|
| 71 |
-
print("1:", line.split())
|
| 72 |
return line.split()
|
| 73 |
|
| 74 |
|
|
@@ -98,7 +97,6 @@ class Tokenizer13a(BaseTokenizer):
|
|
| 98 |
line = line.replace("&amp;", "&")
|
| 99 |
line = line.replace("&lt;", "<")
|
| 100 |
line = line.replace("&gt;", ">")
|
| 101 |
-
print(line)
|
| 102 |
|
| 103 |
return self._post_tokenizer(f" {line} ")
|
| 104 |
|
|
|
|
| 67 |
# no leading or trailing spaces, single space within words
|
| 68 |
# return ' '.join(line.split())
|
| 69 |
# This line is changed with regards to the original tokenizer (seen above) to return individual words
|
| 70 |
+
|
|
|
|
| 71 |
return line.split()
|
| 72 |
|
| 73 |
|
|
|
|
| 97 |
line = line.replace("&amp;", "&")
|
| 98 |
line = line.replace("&lt;", "<")
|
| 99 |
line = line.replace("&gt;", ">")
|
|
|
|
| 100 |
|
| 101 |
return self._post_tokenizer(f" {line} ")
|
| 102 |
|