lab4 / src /Vectorization.py
Shu-vi's picture
Upload 8 files
d4d8ed5 verified
raw
history blame contribute delete
853 Bytes
from gensim.models import Word2Vec, FastText
import joblib
def create_tfidf(path="tfidf_vectorizer.pkl"):
    """Load a fitted TF-IDF vectorizer and build a document-transforming function.

    Args:
        path: Location of the joblib-serialized vectorizer. Defaults to
            ``"tfidf_vectorizer.pkl"``, the path that used to be hard-coded
            here; a relative path is resolved against the current working
            directory.

    Returns:
        A ``(transform, vectorizer)`` tuple. ``transform(docs)`` returns
        ``vectorizer.transform(docs).toarray()``; ``vectorizer`` is the
        loaded object itself, returned so callers can use it directly.
    """
    # NOTE(review): joblib.load unpickles the file, which can execute
    # arbitrary code -- only point `path` at artifacts you trust.
    vectorizer = joblib.load(path)

    def _inner(docs):
        # The transform result is converted with .toarray(); presumably it is
        # a sparse matrix being densified -- confirm against the saved object.
        return vectorizer.transform(docs).toarray()

    # Return both the function and the vectorizer.
    return _inner, vectorizer
def create_w2v(path="./word2vec.model"):
    """Load a saved Word2Vec model and build a word-lookup function.

    Args:
        path: Location of the saved model. Defaults to
            ``"./word2vec.model"``, the path that used to be hard-coded here;
            a relative path is resolved against the current working directory.

    Returns:
        A ``(lookup, model)`` tuple. ``lookup(word)`` returns
        ``model.wv[word]`` when ``word in model.wv`` and ``None`` otherwise;
        ``model`` is the loaded model itself.
    """
    model = Word2Vec.load(path)

    def _inner(word):
        # Read model.wv at call time (not at factory time) so the lookup
        # always goes through the model's current keyed vectors.
        keyed_vectors = model.wv
        return keyed_vectors[word] if word in keyed_vectors else None

    # Return both the function and the model.
    return _inner, model
def create_fasttext(path="./fasttext.model"):
    """Load a saved FastText model and build a word-lookup function.

    Args:
        path: Location of the saved model. Defaults to
            ``"./fasttext.model"``, the path that used to be hard-coded here;
            a relative path is resolved against the current working directory.

    Returns:
        A ``(lookup, model)`` tuple. ``lookup(word)`` returns
        ``model.wv[word]`` when ``word in model.wv`` and ``None`` otherwise;
        ``model`` is the loaded model itself.
    """
    model = FastText.load(path)

    def _inner(word):
        # NOTE(review): FastText can build vectors from character n-grams, so
        # depending on the gensim version `word in model.wv` may be true even
        # for out-of-vocabulary words and the None branch may rarely (or
        # never) trigger -- confirm against the installed gensim.
        keyed_vectors = model.wv
        return keyed_vectors[word] if word in keyed_vectors else None

    # Return both the function and the model.
    return _inner, model