Resume / scripts /utils /tf_idf.py
srbhr's picture
0.0.1 Canary-Releasing code for a second version. (#39)
539fbe4 unverified
raw
history blame contribute delete
248 Bytes
from sklearn.feature_extraction.text import TfidfVectorizer
def do_tfidf(token, *, max_df=0.05, min_df=0.002):
    """Return the TF-IDF vocabulary learned from *token* as one string.

    A ``TfidfVectorizer`` is fitted on ``token`` and the feature names it
    retains after document-frequency pruning are joined with single spaces.

    Args:
        token: Iterable of raw text documents, passed unchanged to
            ``TfidfVectorizer.fit``.
        max_df: Forwarded to ``TfidfVectorizer(max_df=...)``. Defaults to
            the value this function has always used.
        min_df: Forwarded to ``TfidfVectorizer(min_df=...)``. Defaults to
            the value this function has always used.

    Returns:
        The retained feature names, in the order the vectorizer reports
        them, separated by single spaces.

    Raises:
        Whatever ``TfidfVectorizer.fit`` raises for the given input; this
        function does not catch anything. NOTE(review): with these tight
        document-frequency bounds, small corpora presumably fail with
        ``ValueError`` because no terms survive pruning -- confirm against
        callers.
    """
    tfidf = TfidfVectorizer(max_df=max_df, min_df=min_df)
    # Only the learned vocabulary is needed, so fit without transforming.
    tfidf.fit(token)

    # get_feature_names() was removed in scikit-learn 1.2; prefer the
    # replacement and fall back only on releases that predate it.
    get_names = getattr(tfidf, "get_feature_names_out", None)
    if get_names is None:
        get_names = tfidf.get_feature_names

    return " ".join(get_names())