Spaces:

singhn9
/

SteelAI_Module2_EAF_Intelligence_Explorer

Sleeping

App Files Files Community

singhn9 committed on Nov 7, 2025

Commit

b056229

verified ·

1 Parent(s): 9a0d8df

Update src/streamlit_app.py

Browse files

Files changed (1) hide show

src/streamlit_app.py +345 -101

src/streamlit_app.py CHANGED Viewed

@@ -361,115 +361,359 @@ with tabs[3]:
     st.dataframe(df.describe().T.style.format("{:.3f}"), height=500)
-# ----- Ensemble + SHAP tab
 with tabs[4]:
-    st.subheader("Autonomous Ensemble Modeling + SHAP Explainability")
-    # --- Step 1: Basic UI selections ---
-    target = st.selectbox("Target variable", numeric_cols, index=numeric_cols.index("furnace_temp") if "furnace_temp" in numeric_cols else 0)
-    default_features = [c for c in numeric_cols if c != target][:60]
-    features = st.multiselect("Model input features", numeric_cols, default=default_features)
-    sample_size = st.slider("Sample rows for training", 500, min(4000, df.shape[0]), 1000, step=100)
-    sub_df = df[features + [target]].sample(n=sample_size, random_state=42)
-    X = sub_df[features].fillna(0)
-    y = sub_df[target].fillna(0)
-    # --- Step 2: Business / Process Objective selection ---
-    st.markdown("### 🎯 Select Operational Objective")
-    objective = st.selectbox(
-        "Optimization Objective",
         [
-            "Maximize Accuracy (R²)",
-            "Minimize RMSE (Stable Control)",
-            "Maximize Yield Ratio (EAF/Inventory)",
-            "Minimize Energy Consumption (Efficiency)",
-            "Balanced (Accuracy + Efficiency)"
         ],
-        index=0
     )
-    # --- Step 3: Auto-tuning with Optuna ---
-    import optuna
-    from sklearn.model_selection import cross_val_score
-    st.markdown("### ⚙️ Auto Tuning in Progress")
-    def objective_fn(trial):  # Optuna objective: build one candidate regressor and return its mean 3-fold CV score on the closed-over X, y
-        model_name = trial.suggest_categorical("model", ["RandomForest", "GradientBoosting", "ExtraTrees"])
-        n_estimators = trial.suggest_int("n_estimators", 100, 600)
-        max_depth = trial.suggest_int("max_depth", 3, 20)
-        learning_rate = trial.suggest_float("learning_rate", 0.01, 0.3, log=True)  # NOTE(review): sampled on every trial but only passed to GradientBoosting; it still lands in study.best_params, which the caller unpacks with ** into whichever estimator won — presumably a TypeError for RandomForest/ExtraTrees
-        if model_name == "RandomForest":
-            model = RandomForestRegressor(n_estimators=n_estimators, max_depth=max_depth, n_jobs=-1)
-        elif model_name == "GradientBoosting":
-            model = GradientBoostingRegressor(n_estimators=n_estimators, learning_rate=learning_rate, max_depth=max_depth)
-        else:
-            model = ExtraTreesRegressor(n_estimators=n_estimators, max_depth=max_depth, n_jobs=-1)
-        # Metric selection: R² by default, negative RMSE when the UI objective mentions "RMSE"; the yield/energy/balanced objectives have no dedicated metric and fall through to R²
-        scoring_metric = "r2"
-        if "RMSE" in objective:
-            scoring_metric = "neg_root_mean_squared_error"
-        score = cross_val_score(model, X, y, cv=3, scoring=scoring_metric).mean()  # both metrics are "higher is better", matching a maximize study
-        return score
-    if st.button("Run Auto Ensemble Optimization"):
-        with st.spinner("Optimizing models... please wait (~20–60s)"):
-            study = optuna.create_study(direction="maximize")
-            study.optimize(objective_fn, n_trials=20)
-            best_params = study.best_params
-            st.success("✅ Best Auto-Tuned Model Found")
-            st.json(best_params)
-            # Build best model
-            model_name = best_params.pop("model")
-            if model_name == "RandomForest":
-                model = RandomForestRegressor(**best_params)
-            elif model_name == "GradientBoosting":
-                model = GradientBoostingRegressor(**best_params)
             else:
-                model = ExtraTreesRegressor(**best_params)
-            model.fit(X, y)
-            # Save model
-            joblib.dump(model, ENSEMBLE_ARTIFACT)
-            st.caption(f"Model saved: {ENSEMBLE_ARTIFACT}")
-            # --- Auto Visualizations ---
-            st.markdown("### 📈 Optimization History")
-            fig_hist = optuna.visualization.matplotlib.plot_optimization_history(study)
-            st.pyplot(fig_hist)
-            # Predictions
-            X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
-            y_pred = model.predict(X_test)
-            r2 = r2_score(y_test, y_pred)
-            rmse = mean_squared_error(y_test, y_pred, squared=False)
-            st.metric("R² Score", f"{r2:.3f}")
-            st.metric("RMSE", f"{rmse:.3f}")
-            # Scatter plot
-            fig, ax = plt.subplots(figsize=(7,4))
-            ax.scatter(y_test, y_pred, alpha=0.6)
-            ax.plot([y_test.min(), y_test.max()], [y_test.min(), y_test.max()], "r--")
-            ax.set_xlabel("Actual"); ax.set_ylabel("Predicted")
-            st.pyplot(fig)
-            # --- SHAP Explainability for Best Model ---
-            st.markdown("### 🔍 SHAP Explainability (Auto Model)")
-            explainer = shap.TreeExplainer(model)
-            shap_values = explainer.shap_values(X_test.sample(300))
-            fig_shap = plt.figure(figsize=(8,6))
-            shap.summary_plot(shap_values, X_test.sample(300), show=False)
-            st.pyplot(fig_shap)
-            st.info("Auto tuning complete. Model performance and SHAP summary shown above.")
 # -----  Target & Business Impact tab
 with tabs[5]:

     st.dataframe(df.describe().T.style.format("{:.3f}"), height=500)
+# ----- Ensemble + SHAP tab (Expanded AutoML + Stacking + Multi-Family): choose a use case, tune several model families with Optuna, stack them with Ridge, explain with SHAP -----
 with tabs[4]:
+    st.subheader(" AutoML Ensemble — Expanded Families + Stacking + SHAP")
+    # --- Step 0: High-level Use Case (keeps previous defaults); the choice fixes the regression target and a model-family hint ---
+    st.markdown("###  Choose Industrial Use Case ")
+    use_case = st.selectbox(
+        "Select Use Case",
         [
+            "Predictive Maintenance",
+            "EAF Data Intelligence",
+            "Casting Quality Optimization",
+            "Rolling Mill Energy Optimization",
+            "Surface Defect Detection (Vision AI)",
+            "Material Composition & Alloy Mix AI",
+            "Inventory & Yield Optimization",
+            "Refractory & Cooling Loss Prediction"
         ],
+        index=1
     )
+    # Map use-case -> defaults (same as before). NOTE(review): only the casting entry checks that its target column exists; the other targets are hard-coded names that are never validated before df is indexed with them below
+    use_case_config = {
+        "Predictive Maintenance": {"target": "bearing_temp", "model_hint": "RandomForest"},
+        "EAF Data Intelligence": {"target": "furnace_temp", "model_hint": "GradientBoosting"},
+        "Casting Quality Optimization": {"target": "surface_temp" if "surface_temp" in numeric_cols else "furnace_temp", "model_hint": "GradientBoosting"},
+        "Rolling Mill Energy Optimization": {"target": "energy_efficiency", "model_hint": "ExtraTrees"},
+        "Surface Defect Detection (Vision AI)": {"target": "image_entropy_proxy", "model_hint": "GradientBoosting"},
+        "Material Composition & Alloy Mix AI": {"target": "chemical_C", "model_hint": "RandomForest"},
+        "Inventory & Yield Optimization": {"target": "yield_ratio", "model_hint": "GradientBoosting"},
+        "Refractory & Cooling Loss Prediction": {"target": "lining_thickness", "model_hint": "ExtraTrees"},
+    }
+    cfg = use_case_config.get(use_case, {"target": numeric_cols[0], "model_hint": "RandomForest"})
+    target = cfg["target"]
+    model_hint = cfg["model_hint"]  # in this tab the hint is only displayed; it does not steer which families are tuned
+    # --- Feature auto-suggestion (keeps your earlier heuristic): columns sharing a name token with the target, else process keywords, else the first 50 numeric columns. NOTE(review): the target's own name matches its tokens, so if target is in numeric_cols it is suggested as a feature — that would duplicate the column in sub_df and leak the label into X ---
+    suggested = [c for c in numeric_cols if any(k in c for k in target.split('_'))]
+    if len(suggested) < 6:
+        suggested = [c for c in numeric_cols if any(k in c for k in ["temp", "power", "energy", "pressure", "yield"])]
+    if len(suggested) < 6:
+        suggested = numeric_cols[:50]
+    features = st.multiselect("Model input features (auto-suggested)", numeric_cols, default=suggested)
+    st.markdown(f"Auto target: `{target}` · Suggested family hint: `{model_hint}`")
+    # --- Data sampling controls: cap at 20000 rows. NOTE(review): the slider minimum is fixed at 500, so a df with fewer than 500 rows gives min > max — confirm how st.slider handles that ---
+    max_rows = min(df.shape[0], 20000)
+    sample_size = st.slider("Sample rows (train speed vs fidelity)", 500, max_rows, min(1500, max_rows), step=100)
+    sub_df = df[features + [target]].sample(n=sample_size, random_state=42).reset_index(drop=True)  # fixed seed; index reset so positional and label indexing agree later
+    X = sub_df[features].fillna(0)  # missing values are replaced with 0, not imputed
+    y = sub_df[target].fillna(0)
+    # --- Ensemble control UI: tuning budget, ensemble size, and whether optional libraries are probed ---
+    st.markdown("### Ensemble & AutoML Settings")
+    max_trials = st.slider("Optuna trials per family (total trials grow with families)", 5, 80, 20, step=5)
+    top_k = st.slider("Max base models to keep in final ensemble", 2, 8, 5)
+    allow_advanced = st.checkbox("Include advanced families (XGBoost, LightGBM, CatBoost, TabPFN if installed)", value=True)
+    # --- Conditional imports (graceful fallbacks): each optional library is probed and its availability recorded in optional_families ---
+    available_models = ["RandomForest", "ExtraTrees"]  # always available (sklearn). NOTE(review): "MLP" is always tuned later but is not listed here, so the displayed list is incomplete
+    optional_families = {}
+    if allow_advanced:
+        try:
+            import xgboost as xgb
+            optional_families["XGBoost"] = True
+            available_models.append("XGBoost")
+        except Exception:
+            optional_families["XGBoost"] = False
+        try:
+            import lightgbm as lgb
+            optional_families["LightGBM"] = True
+            available_models.append("LightGBM")
+        except Exception:
+            optional_families["LightGBM"] = False
+        try:
+            import catboost as cb
+            optional_families["CatBoost"] = True
+            available_models.append("CatBoost")
+        except Exception:
+            optional_families["CatBoost"] = False
+        try:
+            # TabPFN is often packaged differently; attempt import but it's optional (only availability is recorded; the module itself is not used in this section)
+            import tabpfn
+            optional_families["TabPFN"] = True
+            available_models.append("TabPFN")
+        except Exception:
+            optional_families["TabPFN"] = False
+        try:
+            # FT-Transformer optional. NOTE(review): detection only — tune_family below has no FTTransformer branch, so this family is tuned as its RandomForest fallback
+            from pytorch_tabular.models import transformers  # may not be installed
+            optional_families["FTTransformer"] = True
+            available_models.append("FTTransformer")
+        except Exception:
+            optional_families["FTTransformer"] = False
+    st.markdown(f"Available model families: {', '.join(available_models)}")
+    # --- Optuna tuning routine per family (imports are local to this tab and re-executed on every Streamlit rerun) ---
+    import optuna
+    from sklearn.model_selection import cross_val_score, KFold
+    from sklearn.ensemble import RandomForestRegressor, ExtraTreesRegressor
+    from sklearn.linear_model import Ridge
+    from sklearn.neural_network import MLPRegressor
+    from sklearn.metrics import r2_score, mean_squared_error
+    def tune_family(family_name, X_local, y_local, n_trials=20, random_state=42):  # relies on the enclosing scope for optional_families and the xgb/lgb/cb modules
+        """Tune one model family using Optuna; returns best (model_obj, cv_score, best_params)."""
+        def obj(trial):  # Optuna objective: mean 3-fold CV R² of one sampled configuration
+            # sample hyperparams per family; optional families are only used when their import succeeded
+            if family_name == "RandomForest":
+                n_estimators = trial.suggest_int("n_estimators", 100, 800)
+                max_depth = trial.suggest_int("max_depth", 4, 30)
+                m = RandomForestRegressor(n_estimators=n_estimators, max_depth=max_depth, n_jobs=-1, random_state=random_state)
+            elif family_name == "ExtraTrees":
+                n_estimators = trial.suggest_int("n_estimators", 100, 800)
+                max_depth = trial.suggest_int("max_depth", 4, 30)
+                m = ExtraTreesRegressor(n_estimators=n_estimators, max_depth=max_depth, n_jobs=-1, random_state=random_state)
+            elif family_name == "XGBoost" and optional_families.get("XGBoost"):
+                n_estimators = trial.suggest_int("n_estimators", 100, 1000)
+                max_depth = trial.suggest_int("max_depth", 3, 12)
+                lr = trial.suggest_float("learning_rate", 0.01, 0.3, log=True)
+                m = xgb.XGBRegressor(n_estimators=n_estimators, max_depth=max_depth, learning_rate=lr, tree_method="hist", verbosity=0, random_state=random_state, n_jobs=1)
+            elif family_name == "LightGBM" and optional_families.get("LightGBM"):
+                n_estimators = trial.suggest_int("n_estimators", 100, 1000)
+                max_depth = trial.suggest_int("max_depth", 3, 16)
+                lr = trial.suggest_float("learning_rate", 0.01, 0.3, log=True)
+                m = lgb.LGBMRegressor(n_estimators=n_estimators, max_depth=max_depth, learning_rate=lr, n_jobs=1, random_state=random_state)
+            elif family_name == "CatBoost" and optional_families.get("CatBoost"):
+                iterations = trial.suggest_int("iterations", 200, 1000)
+                depth = trial.suggest_int("depth", 4, 10)
+                lr = trial.suggest_float("learning_rate", 0.01, 0.3, log=True)
+                m = cb.CatBoostRegressor(iterations=iterations, depth=depth, learning_rate=lr, verbose=0, random_state=random_state)
+            elif family_name == "MLP":
+                hidden = trial.suggest_int("hidden_layer_sizes", 32, 512, log=True)  # width of the single hidden layer
+                lr = trial.suggest_float("learning_rate_init", 1e-4, 1e-1, log=True)
+                m = MLPRegressor(hidden_layer_sizes=(hidden,), learning_rate_init=lr, max_iter=500, random_state=random_state)
+            elif family_name == "TabPFN" and optional_families.get("TabPFN"):
+                # TabPFN is not actually tuned: no model is built or fitted in this branch.
+                # NOTE(review): every trial returns the same constant, so all n_trials are spent without evaluating anything.
+                # The real model object is substituted later (a placeholder string is returned below).
+                return 0.0
             else:
+                # fallback to a small RandomForest to avoid crashing; this also covers any family without its own branch (e.g. FTTransformer), with no hyperparameters sampled
+                m = RandomForestRegressor(n_estimators=200, max_depth=8, random_state=random_state, n_jobs=-1)
+            # use negative RMSE if better for our domain? keep R2 for generality
+            try:
+                scores = cross_val_score(m, X_local, y_local, scoring="r2", cv=3, n_jobs=1)
+                return float(np.mean(scores))
+            except Exception:
+                return -999.0  # sentinel: a configuration that fails to fit scores far below any real R² instead of aborting the study
+        study = optuna.create_study(direction="maximize")
+        study.optimize(obj, n_trials=n_trials, show_progress_bar=False)
+        best = study.best_trial.params if study.trials else {}  # empty for families whose branch samples no parameters
+        # instantiate best model from the winning params (defaults apply when a key is absent). NOTE(review): random_state is hard-coded to 42 here, ignoring the random_state argument used during tuning
+        try:
+            if family_name == "RandomForest":
+                model = RandomForestRegressor(n_estimators=best.get("n_estimators",200), max_depth=best.get("max_depth",8), n_jobs=-1, random_state=42)
+            elif family_name == "ExtraTrees":
+                model = ExtraTreesRegressor(n_estimators=best.get("n_estimators",200), max_depth=best.get("max_depth",8), n_jobs=-1, random_state=42)
+            elif family_name == "XGBoost" and optional_families.get("XGBoost"):
+                model = xgb.XGBRegressor(n_estimators=best.get("n_estimators",200), max_depth=best.get("max_depth",6), learning_rate=best.get("learning_rate",0.1), tree_method="hist", verbosity=0, random_state=42, n_jobs=1)
+            elif family_name == "LightGBM" and optional_families.get("LightGBM"):
+                model = lgb.LGBMRegressor(n_estimators=best.get("n_estimators",200), max_depth=best.get("max_depth",8), learning_rate=best.get("learning_rate",0.1), n_jobs=1, random_state=42)
+            elif family_name == "CatBoost" and optional_families.get("CatBoost"):
+                model = cb.CatBoostRegressor(iterations=best.get("iterations",200), depth=best.get("depth",6), learning_rate=best.get("learning_rate",0.1), verbose=0, random_state=42)
+            elif family_name == "MLP":
+                model = MLPRegressor(hidden_layer_sizes=(best.get("hidden_layer_sizes",128),), learning_rate_init=best.get("learning_rate_init",0.001), max_iter=500, random_state=42)
+            elif family_name == "TabPFN" and optional_families.get("TabPFN"):
+                # Sentinel string, not an estimator; callers must special-case it before calling fit/predict
+                model = "TabPFN_placeholder"
+            else:
+                model = RandomForestRegressor(n_estimators=200, max_depth=8, random_state=42, n_jobs=-1)
+        except Exception:
+            model = RandomForestRegressor(n_estimators=200, max_depth=8, random_state=42, n_jobs=-1)
+        # compute cross-validated score for the best model (a second CV pass over the winning config). NOTE(review): the TabPFN placeholder string is passed here too, so its cv_score is presumably always the -999.0 sentinel
+        try:
+            score = float(np.mean(cross_val_score(model, X_local, y_local, scoring="r2", cv=3, n_jobs=1)))
+        except Exception:
+            score = -999.0
+        return {"model_obj": model, "cv_score": score, "best_params": best, "family": family_name, "study": study}  # a dict, not the tuple the docstring suggests; model_obj is unfitted
+    # --- Run tuning across available families (user triggered); everything below runs only on the rerun where the button was clicked ---
+    run_btn = st.button(" Run expanded AutoML + Stacking")
+    if run_btn:
+        with st.spinner("Tuning multiple families (this may take a while depending on choices)..."):
+            families_to_try = ["RandomForest", "ExtraTrees", "MLP"]  # always tuned, regardless of the "advanced" checkbox
+            if allow_advanced:
+                if optional_families.get("XGBoost"): families_to_try.append("XGBoost")
+                if optional_families.get("LightGBM"): families_to_try.append("LightGBM")
+                if optional_families.get("CatBoost"): families_to_try.append("CatBoost")
+                if optional_families.get("TabPFN"): families_to_try.append("TabPFN")
+                if optional_families.get("FTTransformer"): families_to_try.append("FTTransformer")
+            tuned_results = []
+            for fam in families_to_try:
+                st.caption(f"Tuning family: {fam}")
+                res = tune_family(fam, X, y, n_trials=max_trials)
+                # defensive shape check; tune_family as written always returns a dict with "model_obj"
+                if isinstance(res, dict) and "model_obj" in res:
+                    tuned_results.append(res)
+                else:
+                    st.warning(f"Family {fam} returned unexpected tune result: {res}")
+            # build leaderboard DataFrame, one row per tuned family, best CV R² first
+            lb = pd.DataFrame([{"family": r["family"], "cv_r2": r["cv_score"], "params": r["best_params"]} for r in tuned_results])
+            lb = lb.sort_values("cv_r2", ascending=False).reset_index(drop=True)
+            st.markdown("### Tuning Leaderboard (by CV R²)")
+            st.dataframe(lb[["family","cv_r2"]].round(4))
+            # --- Build base-models and collect out-of-fold preds for stacking (5-fold, shuffled, fixed seed) ---
+            st.markdown("### Building base models & out-of-fold predictions for stacking")
+            kf = KFold(n_splits=5, shuffle=True, random_state=42)
+            base_models = []
+            oof_preds = pd.DataFrame(index=X.index)
+            for idx, row in lb.iterrows():
+                fam = row["family"]
+                model_entry = next((r for r in tuned_results if r["family"] == fam), None)
+                if model_entry is None:
+                    continue
+                model_obj = model_entry["model_obj"]
+                # train out-of-fold predictions: each row is predicted by a model that did not see it
+                oof = np.zeros(X.shape[0])
+                for tr_idx, val_idx in kf.split(X):
+                    X_tr, X_val = X.iloc[tr_idx], X.iloc[val_idx]
+                    y_tr = y.iloc[tr_idx]
+                    # only the TabPFN placeholder is special-cased; every other family goes through plain fit/predict
+                    if model_obj == "TabPFN_placeholder":
+                        try:
+                            # NOTE(review): no TabPFN model is ever built — the "TabPFN" entry is a fixed RandomForest under another name
+                            tmp = RandomForestRegressor(n_estimators=200, max_depth=8, random_state=42, n_jobs=-1)
+                            tmp.fit(X_tr, y_tr)
+                            oof[val_idx] = tmp.predict(X_val)
+                        except Exception:
+                            oof[val_idx] = np.mean(y_tr)
+                    else:
+                        try:
+                            model_obj.fit(X_tr, y_tr)
+                            oof[val_idx] = model_obj.predict(X_val)
+                        except Exception:
+                            # fallback to the training-fold mean so one failing fold does not abort the run (the failure is not reported)
+                            oof[val_idx] = np.mean(y_tr)
+                oof_preds[f"{fam}_oof"] = oof
+                # finally fit model on full data (all sampled rows) so it can be saved and used for prediction
+                try:
+                    if model_entry["model_obj"] == "TabPFN_placeholder":
+                        # fallback full-model: RandomForest (this is what gets stored under the "TabPFN" name)
+                        fitted = RandomForestRegressor(n_estimators=200, max_depth=8, random_state=42, n_jobs=-1)
+                        fitted.fit(X, y)
+                    else:
+                        model_entry["model_obj"].fit(X, y)
+                        fitted = model_entry["model_obj"]
+                except Exception:
+                    fitted = RandomForestRegressor(n_estimators=200, max_depth=8, random_state=42, n_jobs=-1)
+                    fitted.fit(X, y)
+                base_models.append({"family": fam, "model": fitted, "cv_r2": model_entry["cv_score"]})
+            # --- keep top_k models. NOTE(review): nothing is pruned by correlation here — models are ranked by cv_r2 and diversity only breaks exact ties ---
+            if oof_preds.shape[1] == 0:
+                st.error("No base models created — aborting stacking.")
+            else:
+                corr_matrix = oof_preds.corr().abs()
+                # compute diversity score = (1 - mean absolute correlation of this model's OOF preds with the others')
+                diversity = {col: 1 - corr_matrix[col].drop(col).mean() for col in corr_matrix.columns}
+                summary = []
+                for bm in base_models:
+                    col = f"{bm['family']}_oof"
+                    summary.append({"family": bm["family"], "cv_r2": bm["cv_r2"], "diversity": diversity.get(col, 0.0)})
+                summary_df = pd.DataFrame(summary).sort_values(["cv_r2", "diversity"], ascending=[False, False]).reset_index(drop=True)
+                st.markdown("### Base Model Summary (cv_r2, diversity)")
+                st.dataframe(summary_df.round(4))
+                # select top_k: primary key cv_r2, secondary key diversity (same ordering summary_df already has)
+                selected = summary_df.sort_values(["cv_r2","diversity"], ascending=[False, False]).head(top_k)["family"].tolist()
+                st.markdown(f"Selected for stacking (top {top_k}): {selected}")
+                # build stacking training data (OOF preds for selected); the Ridge meta-learner is fit on these for all rows
+                selected_cols = [f"{s}_oof" for s in selected]
+                X_stack = oof_preds[selected_cols].fillna(0)
+                meta = Ridge(alpha=1.0)
+                meta.fit(X_stack, y)
+                # evaluate stacked ensemble on a split of X. NOTE(review): not a true holdout — the base models and meta were already fit on all of X including X_val, so these metrics are optimistic
+                X_tr, X_val, y_tr, y_val = train_test_split(X, y, test_size=0.2, random_state=42)  # train_test_split is not imported in this section; presumably imported earlier in the file
+                # predict with base models -> create meta inputs, one column per selected family in `selected` order (the order meta was fit with)
+                meta_inputs = []
+                for fam in selected:
+                    bm = next((b for b in base_models if b["family"] == fam), None)
+                    if bm is not None:
+                        try:
+                            meta_inputs.append(bm["model"].predict(X_val))
+                        except Exception:
+                            meta_inputs.append(np.full(len(X_val), y_tr.mean()))
+                    else:
+                        meta_inputs.append(np.full(len(X_val), y_tr.mean()))
+                X_meta_val = np.column_stack(meta_inputs)
+                y_meta_pred = meta.predict(X_meta_val)
+                final_r2 = r2_score(y_val, y_meta_pred)
+                final_rmse = mean_squared_error(y_val, y_meta_pred, squared=False)  # NOTE(review): `squared=` was deprecated in scikit-learn 1.4 and removed in 1.6; confirm the pinned version or switch to root_mean_squared_error
+                c1, c2 = st.columns(2)
+                c1.metric("Stacked Ensemble R² (holdout)", f"{final_r2:.4f}")
+                c2.metric("Stacked Ensemble RMSE (holdout)", f"{final_rmse:.4f}")
+                # scatter plot of actual vs stacked prediction with the y = x reference line
+                fig, ax = plt.subplots(figsize=(7,4))
+                ax.scatter(y_val, y_meta_pred, alpha=0.6)
+                ax.plot([y_val.min(), y_val.max()], [y_val.min(), y_val.max()], "r--")
+                ax.set_xlabel("Actual"); ax.set_ylabel("Stacked Predicted")
+                st.pyplot(fig)
+                # save artifacts: selected base models + meta learner + feature/target names, one file per use case (os, DATA_DIR and joblib come from elsewhere in the file)
+                stack_artifact = os.path.join(DATA_DIR, f"stacked_{use_case.replace(' ','_')}.joblib")
+                to_save = {"base_models": {bm["family"]: bm["model"] for bm in base_models if bm["family"] in selected}, "meta": meta, "features": features, "selected": selected, "target": target}
+                joblib.dump(to_save, stack_artifact)
+                st.caption(f"Stacked ensemble saved: {stack_artifact}")
+                # --- SHAP on final stack: approximated by SHAP of the single best base model; the meta-learner itself is not explained ---
+                st.markdown("### Explainability (approximate)")
+                try:
+                    # Prefer SHAP on top base model (tree) for interpretability; selected[0] is the highest-cv_r2 family
+                    top_base = next((b for b in base_models if b["family"] == selected[0]), None)
+                    if top_base is not None and hasattr(top_base["model"], "predict"):
+                        # sample at most 300 rows for speed
+                        sample_X = X_val.sample(min(300, len(X_val)), random_state=42)
+                        if hasattr(top_base["model"], "predict") and ("XGBoost" in top_base["family"] or "LightGBM" in top_base["family"] or "RandomForest" in top_base["family"] or "ExtraTrees" in top_base["family"] or "CatBoost" in top_base["family"]):  # tree-ness is decided by family name only
+                            expl = None
+                            # safe tree explainer creation: any SHAP failure becomes a warning rather than an exception
+                            try:
+                                expl = shap.TreeExplainer(top_base["model"])
+                                shap_vals = expl.shap_values(sample_X)
+                                fig_sh = plt.figure(figsize=(8,6))
+                                shap.summary_plot(shap_vals, sample_X, show=False)
+                                st.pyplot(fig_sh)
+                            except Exception as e:
+                                st.warning(f"SHAP tree explainer unavailable: {e}")
+                        else:
+                            st.info("Top base model not tree-based; SHAP summary skipped. You can inspect per-base feature importances above.")  # NOTE(review): no feature importances are displayed in this section — confirm the message is accurate
+                    else:
+                        st.info("No suitable base model for SHAP explanation found.")
+                except Exception as e:
+                    st.warning(f"SHAP step failed gracefully: {e}")
+                st.success("AutoML + Stacking complete. Review metrics and saved artifacts.")
 # -----  Target & Business Impact tab
 with tabs[5]: