SafeSpaceAI / src /nlp /embeddings.py
Shreya Pal
Make API Key private
5c5b473
raw
history blame contribute delete
241 Bytes
from sklearn.feature_extraction.text import TfidfVectorizer
# Shared TF-IDF vectorizer used by the helper functions in this module.
# max_features caps the learned vocabulary at 5000 terms.
vectorizer = TfidfVectorizer(
    max_features=5000,
)
def fit_vectorizer(texts):
    """Fit the module-level ``vectorizer`` on ``texts``.

    Args:
        texts: Iterable of raw text documents to fit on.

    Returns:
        Whatever ``vectorizer.fit(texts)`` returns (for scikit-learn
        estimators this is the fitted vectorizer itself).
    """
    fitted = vectorizer.fit(texts)
    return fitted
def transform(texts):
    """Convert ``texts`` to a dense TF-IDF matrix using the module-level ``vectorizer``.

    The vectorizer is expected to have been fitted beforehand (for example
    via ``fit_vectorizer``); this function does not fit it.

    Args:
        texts: Iterable of raw text documents to vectorize.

    Returns:
        The dense array produced by calling ``.toarray()`` on the
        vectorizer's transformed output, one row per input document.
    """
    sparse_features = vectorizer.transform(texts)
    # Densify the sparse result; callers receive a regular array.
    dense_features = sparse_features.toarray()
    return dense_features