Diabetes_readmission / models /baseline_tfidf.py
Parishri07's picture
Upload 11 files
dda3dc2 verified
raw
history blame contribute delete
494 Bytes
from sklearn.pipeline import Pipeline
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.linear_model import LogisticRegression
def build_tfidf_model(
    *,
    max_features=20000,
    ngram_range=(1, 2),
    stop_words="english",
    max_iter=1000,
    class_weight="balanced",
) -> Pipeline:
    """Build an unfitted TF-IDF + logistic-regression text classifier.

    The returned pipeline has two named steps: ``"tfidf"``
    (a ``TfidfVectorizer``) followed by ``"clf"`` (a ``LogisticRegression``).
    Nothing is fitted here; the caller is expected to call ``fit`` on the
    result. Calling this function with no arguments reproduces the baseline
    configuration.

    Args:
        max_features: Forwarded to ``TfidfVectorizer(max_features=...)``;
            caps the vocabulary size.
        ngram_range: Forwarded to ``TfidfVectorizer(ngram_range=...)``;
            the default ``(1, 2)`` uses unigrams and bigrams.
        stop_words: Forwarded to ``TfidfVectorizer(stop_words=...)``.
        max_iter: Forwarded to ``LogisticRegression(max_iter=...)``.
        class_weight: Forwarded to ``LogisticRegression(class_weight=...)``.

    Returns:
        A new, unfitted ``Pipeline`` instance.
    """
    vectorizer = TfidfVectorizer(
        max_features=max_features,
        ngram_range=ngram_range,
        stop_words=stop_words,
    )
    classifier = LogisticRegression(
        max_iter=max_iter,
        class_weight=class_weight,
    )
    # Step names are part of the public contract: callers may address them
    # via ``model.named_steps`` or ``tfidf__*`` / ``clf__*`` parameter keys.
    return Pipeline([
        ("tfidf", vectorizer),
        ("clf", classifier),
    ])