File size: 1,928 Bytes
53b92fc
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
# utils/scenario_engine.py
import pandas as pd
import joblib
from utils.models import load_model  # your existing model loader

def simulate_scenario(feature, change, filter=None):
    """
    Dynamic scenario simulator that adapts to any dataset/model schema.
    """

    # 1️⃣ Load dataset and model
    df = pd.read_csv("appdata_rf.csv")
    model = load_model("models/app_best.joblib")

    # 2️⃣ Dynamically read model feature names
    expected_features = getattr(model, "feature_names_in_", list(df.select_dtypes(include='number').columns))
    print("Model expects:", expected_features)

    # 3️⃣ Parse change instruction
    try:
        pct_change = float(change.replace("%", "")) / 100 if "%" in change else float(change)
    except ValueError:
        return {"summary": f"⚠️ Invalid change value '{change}'", "df": df}

    # 4️⃣ Apply filter if any
    try:
        subset = df.query(filter) if filter else df.copy()
    except Exception as e:
        return {"summary": f"⚠️ Invalid filter '{filter}': {e}", "df": df}

    # 5️⃣ Apply the change dynamically
    if feature not in df.columns:
        return {"summary": f"⚠️ Feature '{feature}' not found in dataset.", "df": df}

    subset[feature] *= (1 + pct_change)
    if filter:
        df.loc[subset.index, feature] = subset[feature]
    else:
        df = subset

    # 6️⃣ Predict new churn rate using expected model inputs
    try:
        X = df[expected_features]
        churn_prob = model.predict_proba(X)[:, 1]
        new_churn_rate = churn_prob.mean() * 100
    except Exception as e:
        return {"summary": f"⚠️ Prediction error: {e}", "df": df}

    # 7️⃣ Return result
    summary = (
        f"📊 New churn rate = {new_churn_rate:.2f}% "
        f"after changing **{feature}** by {change}."
        + (f" (Filter: {filter})" if filter else "")
    )
    return {"summary": summary, "df": df}