Spaces:
Sleeping
Sleeping
File size: 443 Bytes
fbb3f82 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 |
import spacy
nlp = spacy.load('en_core_web_sm')
def preprocesser(text_array):
preprocessed_texts = []
for text in text_array:
doc = nlp(text)
words_lst = []
for token in doc:
if not token.is_stop and not token.is_punct:
words_lst.append(token.lemma_)
preprocessed_text = " ".join(words_lst)
preprocessed_texts.append(preprocessed_text)
return preprocessed_texts |