File size: 119 Bytes
09daf0b
 
 
 
 
 
1
2
3
4
5
6
7
import re

def tokenize(text):
    """Return the lowercase word tokens of *text* with punctuation removed.

    The input is lowercased, every character that is neither a word
    character (``\\w``: letters, digits, underscore) nor whitespace is
    deleted, and the remainder is split on runs of whitespace.

    Punctuation is deleted rather than replaced by a space, so characters
    on either side of it are joined: ``"foo-bar"`` becomes ``"foobar"``.

    Args:
        text: The string to tokenize.

    Returns:
        A list of tokens; empty when *text* holds no word characters.
    """
    # Lowercase first, strip non-word/non-space characters, then split.
    return re.sub(r"[^\w\s]", "", text.lower()).split()