ESGToolKit / embeddings.py
GirishaBuilds01's picture
Update embeddings.py
f283da3 verified
raw
history blame contribute delete
207 Bytes
from sklearn.feature_extraction.text import TfidfVectorizer
# Module-wide TF-IDF vectorizer used by embed(); its vocabulary is capped
# at 512 terms via max_features.
vectorizer = TfidfVectorizer(
    max_features=512,
)
def embed(text: str) -> list:
    """Return a TF-IDF vector for ``text`` as a plain list of floats.

    The module-level ``vectorizer`` is refitted on ``text`` alone on every
    call, so the learned vocabulary consists only of this text's own
    terms. The returned list has one entry per distinct term found in
    ``text`` (capped by the vectorizer's ``max_features``), which means
    its length varies from call to call.

    NOTE(review): because each call learns a fresh vocabulary, position
    ``i`` refers to a different term in every result, so vectors from
    separate calls are not directly comparable. If comparable embeddings
    are needed, the vectorizer would have to be fitted once on a shared
    corpus and only ``transform`` used here -- confirm the intent with
    the callers before changing this.

    Args:
        text: The document to vectorize.

    Returns:
        A list of floats. The list is empty when ``text`` yields no terms
        (for example an empty string or punctuation only).
    """
    # fit_transform raises ValueError("empty vocabulary ...") when the
    # analyzer extracts no terms. Such a text simply has zero features, so
    # return the zero-length vector instead of crashing. Using the
    # vectorizer's own analyzer keeps this check in sync with whatever
    # tokenization rules the vectorizer is configured with.
    if not vectorizer.build_analyzer()(text):
        return []

    matrix = vectorizer.fit_transform([text])
    # A single input document produces a single-row matrix; flatten that
    # row into native Python floats.
    return matrix.toarray()[0].tolist()