File size: 248 Bytes
cc44155
 
dd4da83
cc44155
c2d1e63
cc44155
 
dd4da83
1
2
3
4
5
6
7
8
9
from sklearn.feature_extraction.text import TfidfVectorizer


def do_tfidf(token):
    """Return the terms a TF-IDF vectorizer keeps for ``token``, space-joined.

    A ``TfidfVectorizer`` is fitted with ``max_df=0.05`` and ``min_df=0.002``.
    Per the scikit-learn documentation, float values are document-frequency
    proportions: terms found in more than 5% of the documents, or in fewer
    than 0.2% of them, are dropped from the vocabulary.

    Args:
        token: The corpus handed straight to the vectorizer. Presumably an
            iterable of document strings -- TODO confirm against callers.

    Returns:
        A single string holding every retained term, separated by one space,
        in the vectorizer's feature order.

    Raises:
        ValueError: Propagated from scikit-learn, e.g. when the thresholds
            leave no terms in the vocabulary.
    """
    tfidf = TfidfVectorizer(max_df=0.05, min_df=0.002)
    # The weighted matrix was never used; fitting alone learns the vocabulary.
    tfidf.fit(token)

    # get_feature_names() was deprecated in scikit-learn 1.0 and removed in
    # 1.2. Prefer its replacement, but keep working on older installations.
    if hasattr(tfidf, "get_feature_names_out"):
        feature_names = tfidf.get_feature_names_out()
    else:
        feature_names = tfidf.get_feature_names()

    return " ".join(feature_names)