opinion-summarizer / src /utils /text_utils.py
Anshrathore01's picture
Remove tracked venv and refine gitignore
6f953dc
raw
history blame contribute delete
246 Bytes
from nltk.stem import PorterStemmer
from nltk.tokenize import word_tokenize
import re
# Single stemmer instance created at import time and reused by stem_text.
ps = PorterStemmer()
def stem_text(text):
    """Return *text* with each token replaced by its stem.

    The input is split into tokens with ``word_tokenize``, every token is
    passed through the module-level ``PorterStemmer`` instance ``ps``, and
    the stemmed tokens are joined back together with single spaces.

    Falsy input (for example ``None`` or an empty string) short-circuits to
    an empty string without invoking the tokenizer.
    """
    if text:
        stemmed = [ps.stem(token) for token in word_tokenize(text)]
        return " ".join(stemmed)
    return ""