| import pandas as pd |
| from sklearn.feature_extraction.text import TfidfVectorizer |
| from sklearn.linear_model import LogisticRegression |
|
|
| data = pd.read_csv('dataset.csv') |
| vectorizer = TfidfVectorizer() |
| X = vectorizer.fit_transform(data['text']) |
| y = data['label'] |
|
|
| classifier = LogisticRegression() |
| classifier.fit(X, y) |
|
|
| def predict(text): |
| text_vectorized = vectorizer.transform([text]) |
| prediction = classifier.predict(text_vectorized)[0] |
| if prediction == 'AI': |
| score = classifier.predict_proba(text_vectorized)[0][0] |
| else: |
| score = 1 - classifier.predict_proba(text_vectorized)[0][1] |
| response = [ |
| { |
| 'label': prediction, |
| 'score': round(float(score), 4) |
| } |
| ] |
| return response |
|
|