import os
from pathlib import Path

import joblib
import pandas as pd
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import classification_report
from sklearn.model_selection import train_test_split

# ---------------------------------------------------------------------------
# Train a logistic-regression classifier on the lead data and save it to disk.
#
# Steps: load "lead_data.csv", integer-encode the categorical columns, hold
# out 20% of the rows for evaluation, fit the model, print a classification
# report for the held-out rows, and write the fitted model to model/model.pkl.
# ---------------------------------------------------------------------------

# Fixed seed so the train/test split (and therefore the printed metrics) is
# the same on every run instead of changing with each invocation.
RANDOM_STATE = 42

CATEGORICAL_COLUMNS = ["lead_source", "region"]
FEATURE_COLUMNS = ["lead_source", "response_time", "activity_level", "region"]
TARGET_COLUMN = "converted"

MODEL_DIR = Path("model")
MODEL_PATH = MODEL_DIR / "model.pkl"

# Load the raw lead records.
data = pd.read_csv("lead_data.csv")

# Replace each categorical column with its integer category codes.
# NOTE(review): the label -> code mapping is derived from this CSV and is not
# saved with the model, so inference code must reproduce the same encoding;
# missing values are encoded as -1 by pandas. Confirm this is intended.
for column in CATEGORICAL_COLUMNS:
    data[column] = data[column].astype("category").cat.codes

# Feature matrix and target vector.
X = data[FEATURE_COLUMNS]
y = data[TARGET_COLUMN]

# Hold out 20% of the rows for evaluation.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=RANDOM_STATE
)

# Fit the classifier on the training portion.
model = LogisticRegression(max_iter=200)
model.fit(X_train, y_train)

# Report performance on the held-out rows.
preds = model.predict(X_test)
print("\nModel Performance:\n")
print(classification_report(y_test, preds))

# Create the output directory if needed; exist_ok avoids the check-then-create
# race of an os.path.exists() test followed by os.mkdir().
MODEL_DIR.mkdir(parents=True, exist_ok=True)

joblib.dump(model, MODEL_PATH)
print("✅ Model saved as model/model.pkl")