File size: 751 Bytes
63abdd9 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 | import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.linear_model import LogisticRegression
data = pd.read_csv('dataset.csv')
vectorizer = TfidfVectorizer()
X = vectorizer.fit_transform(data['text'])
y = data['label']
classifier = LogisticRegression()
classifier.fit(X, y)
def predict(text):
text_vectorized = vectorizer.transform([text])
prediction = classifier.predict(text_vectorized)[0]
if prediction == 'AI':
score = classifier.predict_proba(text_vectorized)[0][0]
else:
score = 1 - classifier.predict_proba(text_vectorized)[0][1]
response = [
{
'label': prediction,
'score': round(float(score), 4)
}
]
return response
|