cc44155
dd4da83
cc44155
c2d1e63
cc44155
dd4da83 | | from sklearn.feature_extraction.text import TfidfVectorizer
def do_tfidf(token):
    """Return the TF-IDF vocabulary learned from *token* as one string.

    A ``TfidfVectorizer`` is fitted with ``max_df=0.05`` and
    ``min_df=0.002``; per the scikit-learn documentation, float values for
    these options are document-frequency proportions, so terms found in
    more than 5% or fewer than 0.2% of the documents are discarded.

    Args:
        token: Passed straight to the vectorizer's ``fit``; presumably an
            iterable of document strings -- confirm against the caller.

    Returns:
        The surviving feature names, in the vectorizer's feature order,
        joined by single spaces.
    """
    tfidf = TfidfVectorizer(max_df=0.05, min_df=0.002)
    # Only the learned vocabulary is used, so the TF-IDF matrix itself
    # does not need to be computed or kept.
    tfidf.fit(token)
    # get_feature_names() was removed in scikit-learn 1.2; prefer the
    # replacement and fall back only on releases that predate it.
    if hasattr(tfidf, "get_feature_names_out"):
        feature_names = tfidf.get_feature_names_out()
    else:
        feature_names = tfidf.get_feature_names()
    return " ".join(feature_names)
|