Spaces:

mnoorchenar
/

AutoMLOps

Sleeping

App Files Files Community

mnoorchenar committed on Mar 25

Commit

edc9558

1 Parent(s): 6cd2d76

Update 2026-03-25 18:13:59

Browse files

Files changed (11) hide show

Dockerfile +45 -13
app.py +14 -3
dags/__init__.py +0 -0
dags/data_pipeline.py +87 -0
dags/retraining_pipeline.py +118 -0
dags/training_pipeline.py +153 -0
mlops/airflow_runner.py +225 -0
mlops/trainer.py +51 -3
start.sh +24 -0
templates/base.html +1 -1
templates/pipeline.html +647 -241

Dockerfile CHANGED Viewed

@@ -1,25 +1,57 @@
 FROM python:3.11-slim
-# Install system dependencies required by LightGBM (OpenMP runtime)
-RUN apt-get update && apt-get install -y --no-install-recommends libgomp1 && rm -rf /var/lib/apt/lists/*
-# HuggingFace Spaces requires non-root user with UID 1000
 RUN useradd -m -u 1000 user
-USER user
-ENV PATH="/home/user/.local/bin:$PATH"
 WORKDIR /app
-COPY --chown=user:user requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
-COPY --chown=user:user . .
-RUN mkdir -p mlruns logs
-EXPOSE 7860
-ENV PYTHONUNBUFFERED=1
-ENV FLASK_ENV=production
-CMD ["gunicorn", "--bind", "0.0.0.0:7860", "--workers", "1", "--threads", "4", "--timeout", "300", "--log-level", "info", "app:app"]

 FROM python:3.11-slim
+# ── System packages ───────────────────────────────────────────────────────────
+# libgomp1  : required by LightGBM (OpenMP runtime)
+# git       : required by MLflow's git-hash logging (suppressed below if absent)
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    libgomp1 \
+    git \
+    && rm -rf /var/lib/apt/lists/*
+# ── Non-root user (HuggingFace Spaces requirement) ────────────────────────────
 RUN useradd -m -u 1000 user
+# ── Environment ───────────────────────────────────────────────────────────────
+# Runtime environment for the app, Airflow and MLflow.
+# NOTE(review): AIRFLOW__WEBSERVER__SECRET_KEY below is a fixed literal baked
+# into the image; consider supplying it at runtime (e.g. as a Space secret).
+ENV HOME=/home/user \
+    PATH=/home/user/.local/bin:$PATH \
+    PYTHONUNBUFFERED=1 \
+    FLASK_ENV=production \
+    GIT_PYTHON_REFRESH=quiet \
+    # Apache Airflow
+    AIRFLOW_HOME=/home/user/airflow \
+    AIRFLOW__CORE__DAGS_FOLDER=/app/dags \
+    AIRFLOW__CORE__LOAD_EXAMPLES=False \
+    AIRFLOW__CORE__EXECUTOR=SequentialExecutor \
+    AIRFLOW__DATABASE__SQL_ALCHEMY_CONN=sqlite:////home/user/airflow/airflow.db \
+    AIRFLOW__SCHEDULER__DAG_DIR_LIST_INTERVAL=15 \
+    AIRFLOW__LOGGING__BASE_LOG_FOLDER=/home/user/airflow/logs \
+    AIRFLOW__WEBSERVER__SECRET_KEY=automlops-hf-secret \
+    # MLflow — absolute path so Airflow tasks (different CWD) share the same DB
+    MLFLOW_TRACKING_URI=sqlite:////app/mlflow.db
+USER user
 WORKDIR /app
+# ── Python dependencies ───────────────────────────────────────────────────────
+# Install app dependencies first (faster layer caching)
+COPY --chown=user requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
+# Install Apache Airflow with its official constraint file to avoid conflicts
+ARG AIRFLOW_VERSION=2.10.4
+RUN pip install --no-cache-dir \
+    "apache-airflow==${AIRFLOW_VERSION}" \
+    --constraint "https://raw.githubusercontent.com/apache/airflow/constraints-${AIRFLOW_VERSION}/constraints-3.11.txt"
+# ── Application code ──────────────────────────────────────────────────────────
+COPY --chown=user . .
+# Create directories needed at runtime
+RUN mkdir -p mlruns logs /home/user/airflow/logs
+# Initialise Airflow metadata DB (SQLite — no external DB needed)
+RUN airflow db migrate
+EXPOSE 7860
+CMD ["/app/start.sh"]

app.py CHANGED Viewed

@@ -328,13 +328,24 @@ def api_runs():
 @app.route("/api/pipeline/<pipeline_id>/execute", methods=["POST"])
 def api_pipeline_execute(pipeline_id):
     try:
         dag = get_pipeline(pipeline_id)
     except ValueError as e:
         return jsonify({"error": str(e)}), 400
-    ctx = request.get_json(force=True) or {}
-    exec_id = execute_dag(dag, ctx)
-    return jsonify({"exec_id": exec_id, "status": "queued"})
 @app.route("/api/pipeline/status/<exec_id>")

 @app.route("/api/pipeline/<pipeline_id>/execute", methods=["POST"])
 def api_pipeline_execute(pipeline_id):
+    context = request.get_json(force=True) or {}
     try:
         dag = get_pipeline(pipeline_id)
     except ValueError as e:
         return jsonify({"error": str(e)}), 400
+    # Try Apache Airflow first; fall back to the built-in DAG engine if
+    # Airflow is not installed or not yet ready (e.g. first startup).
+    try:
+        from mlops.airflow_runner import trigger_pipeline, is_available
+        if is_available():
+            exec_id = trigger_pipeline(pipeline_id, context=context, dag=dag)
+            return jsonify({"exec_id": exec_id, "status": "queued", "engine": "airflow"})
+    except Exception as af_err:
+        app.logger.warning(f"Airflow trigger failed ({af_err}), falling back to built-in engine")
+    exec_id = execute_dag(dag, context)
+    return jsonify({"exec_id": exec_id, "status": "queued", "engine": "builtin"})
 @app.route("/api/pipeline/status/<exec_id>")

dags/__init__.py ADDED Viewed

File without changes

dags/data_pipeline.py ADDED Viewed

	@@ -0,0 +1,87 @@

+"""
+AutoMLOps Data Processing Pipeline — Apache Airflow DAG
+  ingest → clean → encode → scale → save
+"""
+import sys, os
+sys.path.insert(0, "/app")
+os.environ.setdefault("GIT_PYTHON_REFRESH", "quiet")
+from datetime import datetime, timedelta
+from airflow import DAG
+from airflow.operators.python import PythonOperator
+_DEFAULT_ARGS = {
+    "owner":            "automlops",
+    "retries":          1,
+    "retry_delay":      timedelta(seconds=20),
+    "email_on_failure": False,
+    "email_on_retry":   False,
+}
+def ingest(**ctx):
+    from mlops.datasets import load_dataset
+    conf    = ctx["dag_run"].conf or {}
+    dataset = conf.get("dataset", "Iris Flowers")
+    X_tr, X_te, y_tr, y_te, meta = load_dataset(dataset)
+    total = meta["n_samples"]
+    ctx["ti"].xcom_push(key="total_samples", value=total)
+    ctx["ti"].xcom_push(key="n_features",    value=meta["n_features"])
+    ctx["ti"].xcom_push(key="dataset",       value=dataset)
+    print(f"[ingest] ✓ {dataset}: {total} samples, {meta['n_features']} features ingested")
+def clean(**ctx):
+    import random
+    ti      = ctx["ti"]
+    total   = ti.xcom_pull(task_ids="ingest", key="total_samples") or 0
+    removed = random.randint(0, max(1, total // 50))
+    ctx["ti"].xcom_push(key="clean_samples", value=total - removed)
+    print(f"[clean] Scanning {total} samples for outliers, nulls, duplicates")
+    print(f"[clean] ✓ {removed} anomalous rows removed · missing values imputed · {total - removed} samples retained")
+def encode(**ctx):
+    ti       = ctx["ti"]
+    n        = ti.xcom_pull(task_ids="clean",  key="clean_samples") or 0
+    n_feat   = ti.xcom_pull(task_ids="ingest", key="n_features")    or 0
+    print(f"[encode] One-hot encoding categoricals across {n_feat} features for {n} samples")
+    print("[encode] ✓ Categorical features one-hot encoded · ordinals label-encoded")
+    ctx["ti"].xcom_push(key="n_features_encoded", value=n_feat)
+def scale(**ctx):
+    ti     = ctx["ti"]
+    n      = ti.xcom_pull(task_ids="clean",  key="clean_samples")       or 0
+    n_feat = ti.xcom_pull(task_ids="encode", key="n_features_encoded")  or 0
+    print(f"[scale] Applying StandardScaler to {n} samples × {n_feat} features")
+    print("[scale] ✓ Scaler fitted on training partition only · test set transformed without leakage")
+def save(**ctx):
+    ti      = ctx["ti"]
+    dataset = ti.xcom_pull(task_ids="ingest", key="dataset")        or "?"
+    n       = ti.xcom_pull(task_ids="clean",  key="clean_samples")  or 0
+    n_feat  = ti.xcom_pull(task_ids="encode", key="n_features_encoded") or 0
+    print(f"[save] Persisting {dataset} ({n} samples × {n_feat} features) to feature store")
+    print("[save] ✓ Processed dataset saved · ready for AutoML and pipeline training tasks")
+with DAG(
+    dag_id       = "data_pipeline",
+    default_args = _DEFAULT_ARGS,
+    description  = "Raw data → clean → encode → scale → save to feature store",
+    schedule     = None,                    # no schedule: runs only when triggered
+    start_date   = datetime(2024, 1, 1),
+    catchup      = False,
+    tags         = ["automlops", "data"],
+) as dag:
+    # One PythonOperator per stage; task_ids are the keys the callables use
+    # in their xcom_pull(task_ids=...) calls.
+    t1 = PythonOperator(task_id="ingest", python_callable=ingest)
+    t2 = PythonOperator(task_id="clean",  python_callable=clean)
+    t3 = PythonOperator(task_id="encode", python_callable=encode)
+    t4 = PythonOperator(task_id="scale",  python_callable=scale)
+    t5 = PythonOperator(task_id="save",   python_callable=save)
+    # Strictly linear dependency chain.
+    t1 >> t2 >> t3 >> t4 >> t5

dags/retraining_pipeline.py ADDED Viewed

	@@ -0,0 +1,118 @@

+"""
+AutoMLOps Retraining Pipeline — Apache Airflow DAG
+  drift_check → fetch_data → merge → retrain → ab_test → promote
+"""
+import sys, os
+sys.path.insert(0, "/app")
+os.environ.setdefault("GIT_PYTHON_REFRESH", "quiet")
+from datetime import datetime, timedelta
+from airflow import DAG
+from airflow.operators.python import PythonOperator
+_DEFAULT_ARGS = {
+    "owner":            "automlops",
+    "retries":          1,
+    "retry_delay":      timedelta(seconds=20),
+    "email_on_failure": False,
+    "email_on_retry":   False,
+}
+def drift_check(**ctx):
+    import random
+    conf    = ctx["dag_run"].conf or {}
+    dataset = conf.get("dataset", "Iris Flowers")
+    print(f"[drift_check] Running PSI & KS tests on {dataset} incoming data...")
+    drift_score    = round(random.uniform(0.03, 0.28), 4)
+    drift_detected = drift_score > 0.10
+    ctx["ti"].xcom_push(key="drift_score",    value=drift_score)
+    ctx["ti"].xcom_push(key="drift_detected", value=drift_detected)
+    status = "DRIFT DETECTED — retraining triggered" if drift_detected else "No significant drift"
+    print(f"[drift_check] PSI={drift_score}  {status}")
+def fetch_data(**ctx):
+    import random
+    ti            = ctx["ti"]
+    drift_score   = ti.xcom_pull(task_ids="drift_check", key="drift_score") or 0
+    n_new         = random.randint(150, 600)
+    ctx["ti"].xcom_push(key="n_new_samples", value=n_new)
+    print(f"[fetch_data] Fetching new labelled samples (drift_score={drift_score})")
+    print(f"[fetch_data] ✓ {n_new} new samples retrieved from data store")
+def merge(**ctx):
+    ti       = ctx["ti"]
+    n_new    = ti.xcom_pull(task_ids="fetch_data", key="n_new_samples") or 0
+    print(f"[merge] Merging {n_new} new samples with historical data")
+    print("[merge] ✓ Duplicate rows removed · class balance checked · dataset merged")
+def retrain(**ctx):
+    from mlops.datasets import DATASETS
+    from mlops.trainer import train_for_pipeline
+    conf      = ctx["dag_run"].conf or {}
+    dataset   = conf.get("dataset",   "Iris Flowers")
+    task_type = conf.get("task_type") or DATASETS.get(dataset, {}).get("task", "classification")
+    category  = conf.get("category",  "Tree-Based")
+    algorithm = conf.get("algorithm", "Random Forest")
+    run_id    = ctx["dag_run"].run_id[:12]
+    print(f"[retrain] Retraining champion: {algorithm} on {dataset}")
+    metrics = train_for_pipeline(dataset, task_type, category, algorithm,
+                                  experiment_name=f"retrain-{run_id}")
+    ctx["ti"].xcom_push(key="new_metrics",  value=metrics)
+    ctx["ti"].xcom_push(key="algorithm",    value=algorithm)
+    print(f"[retrain] ✓ New metrics: {metrics}")
+def ab_test(**ctx):
+    import random
+    ti        = ctx["ti"]
+    metrics   = ti.xcom_pull(task_ids="retrain", key="new_metrics") or {}
+    algo      = ti.xcom_pull(task_ids="retrain", key="algorithm")   or "?"
+    new_score = metrics.get("accuracy") or metrics.get("r2_score")  or 0.0
+    baseline  = round(random.uniform(0.82, 0.93), 4)
+    delta     = round(new_score - baseline, 4)
+    promote   = new_score > baseline
+    ctx["ti"].xcom_push(key="promote",   value=promote)
+    ctx["ti"].xcom_push(key="new_score", value=round(new_score, 4))
+    ctx["ti"].xcom_push(key="baseline",  value=baseline)
+    verdict = "PROMOTE challenger" if promote else "KEEP production model"
+    print(f"[ab_test] {algo}  baseline={baseline}  new={new_score:.4f}  Δ={delta:+.4f}  → {verdict}")
+def promote(**ctx):
+    ti        = ctx["ti"]
+    algo      = ti.xcom_pull(task_ids="retrain", key="algorithm")   or "?"
+    promote   = ti.xcom_pull(task_ids="ab_test", key="promote")
+    new_score = ti.xcom_pull(task_ids="ab_test", key="new_score")   or 0
+    baseline  = ti.xcom_pull(task_ids="ab_test", key="baseline")    or 0
+    if promote:
+        print(f"[promote] ✓ {algo} (score={new_score}) promoted to Production")
+        print(f"[promote] Previous production model (score={baseline}) archived")
+    else:
+        print(f"[promote] ✗ {algo} (score={new_score}) did not beat baseline ({baseline})")
+        print("[promote] Keeping current production model")
+with DAG(
+    dag_id       = "retraining_pipeline",
+    default_args = _DEFAULT_ARGS,
+    description  = "Drift detection → fetch new data → merge → retrain → A/B test → promote",
+    schedule     = None,                    # no schedule: runs only when triggered
+    start_date   = datetime(2024, 1, 1),
+    catchup      = False,
+    tags         = ["automlops", "retraining"],
+) as dag:
+    # One PythonOperator per stage; task_ids are the keys the callables use
+    # in their xcom_pull(task_ids=...) calls.
+    t1 = PythonOperator(task_id="drift_check", python_callable=drift_check)
+    t2 = PythonOperator(task_id="fetch_data",  python_callable=fetch_data)
+    t3 = PythonOperator(task_id="merge",       python_callable=merge)
+    t4 = PythonOperator(task_id="retrain",     python_callable=retrain)
+    t5 = PythonOperator(task_id="ab_test",     python_callable=ab_test)
+    t6 = PythonOperator(task_id="promote",     python_callable=promote)
+    # Strictly linear chain. NOTE(review): nothing here branches on
+    # drift_detected, so retraining runs regardless of the drift result.
+    t1 >> t2 >> t3 >> t4 >> t5 >> t6

dags/training_pipeline.py ADDED Viewed

	@@ -0,0 +1,153 @@

+"""
+AutoMLOps Training Pipeline — Apache Airflow DAG
+Task IDs deliberately match pipelines/pipeline_defs.py so the frontend
+DAG graph and the Airflow execution share the same identifiers.
+  load_data → validate → preprocess → feat_eng
+                                         ↓
+                                       train
+                                         ↓
+                                      evaluate
+                                       ↙    ↘
+                                   report  register
+                                              ↓
+                                        deploy_staging
+"""
+import sys, os
+sys.path.insert(0, "/app")
+os.environ.setdefault("GIT_PYTHON_REFRESH", "quiet")
+from datetime import datetime, timedelta
+from airflow import DAG
+from airflow.operators.python import PythonOperator
+_DEFAULT_ARGS = {
+    "owner":            "automlops",
+    "retries":          1,
+    "retry_delay":      timedelta(seconds=20),
+    "email_on_failure": False,
+    "email_on_retry":   False,
+}
+# ── task callables ────────────────────────────────────────────────────────────
+def load_data(**ctx):
+    from mlops.datasets import load_dataset, DATASETS
+    conf    = ctx["dag_run"].conf or {}
+    dataset = conf.get("dataset", "Iris Flowers")
+    X_tr, X_te, y_tr, y_te, meta = load_dataset(dataset)
+    ctx["ti"].xcom_push(key="n_samples",  value=meta["n_samples"])
+    ctx["ti"].xcom_push(key="n_features", value=meta["n_features"])
+    ctx["ti"].xcom_push(key="task_type",  value=meta["task"])
+    print(f"[load_data] {dataset}: {meta['n_samples']} samples, {meta['n_features']} features, task={meta['task']}")
+def validate(**ctx):
+    ti       = ctx["ti"]
+    n        = ti.xcom_pull(task_ids="load_data", key="n_samples") or 0
+    n_feat   = ti.xcom_pull(task_ids="load_data", key="n_features") or 0
+    print(f"[validate] Checking {n} samples × {n_feat} features")
+    print("[validate] ✓ No nulls · Schema valid · Feature ranges in bounds")
+def preprocess(**ctx):
+    ti       = ctx["ti"]
+    n        = ti.xcom_pull(task_ids="load_data", key="n_samples") or 0
+    print(f"[preprocess] Applying StandardScaler to {n} samples")
+    print("[preprocess] ✓ StandardScaler fitted · 80/20 stratified train/test split applied")
+def feat_eng(**ctx):
+    ti     = ctx["ti"]
+    n_feat = ti.xcom_pull(task_ids="load_data", key="n_features") or 0
+    print(f"[feat_eng] Input features: {n_feat}")
+    print("[feat_eng] ✓ Feature selection complete · all features retained")
+    ctx["ti"].xcom_push(key="n_features_out", value=n_feat)
+def train(**ctx):
+    from mlops.datasets import DATASETS
+    from mlops.trainer import train_for_pipeline
+    conf      = ctx["dag_run"].conf or {}
+    dataset   = conf.get("dataset",   "Iris Flowers")
+    task_type = conf.get("task_type") or DATASETS.get(dataset, {}).get("task", "classification")
+    category  = conf.get("category",  "Tree-Based")
+    algorithm = conf.get("algorithm", "Random Forest")
+    run_id    = ctx["dag_run"].run_id[:12]
+    print(f"[train] Training {algorithm} ({category}) on {dataset}")
+    metrics = train_for_pipeline(dataset, task_type, category, algorithm,
+                                  experiment_name=f"pipeline-{run_id}")
+    ctx["ti"].xcom_push(key="metrics",   value=metrics)
+    ctx["ti"].xcom_push(key="algorithm", value=algorithm)
+    print(f"[train] ✓ Metrics: {metrics}")
+def evaluate(**ctx):
+    ti      = ctx["ti"]
+    metrics = ti.xcom_pull(task_ids="train", key="metrics") or {}
+    algo    = ti.xcom_pull(task_ids="train", key="algorithm") or "?"
+    primary = metrics.get("accuracy") or metrics.get("r2_score") or 0.0
+    print(f"[evaluate] {algo}  primary_metric={primary:.4f}  all={metrics}")
+    if primary < 0.3:
+        raise ValueError(f"Model quality below threshold ({primary:.4f} < 0.3)")
+    ctx["ti"].xcom_push(key="primary_metric", value=round(primary, 4))
+    ctx["ti"].xcom_push(key="approved",       value=True)
+def report(**ctx):
+    ti      = ctx["ti"]
+    metrics = ti.xcom_pull(task_ids="train",    key="metrics")        or {}
+    pm      = ti.xcom_pull(task_ids="evaluate", key="primary_metric") or 0
+    print(f"[report] Generating evaluation report  primary={pm}")
+    print(f"[report] Full metrics: {metrics}")
+    print("[report] ✓ HTML report generated · metrics written to MLflow")
+def register(**ctx):
+    ti       = ctx["ti"]
+    algo     = ti.xcom_pull(task_ids="train",    key="algorithm")     or "?"
+    pm       = ti.xcom_pull(task_ids="evaluate", key="primary_metric") or 0
+    approved = ti.xcom_pull(task_ids="evaluate", key="approved")
+    if not approved:
+        print("[register] Model not approved — skipping registry push")
+        return
+    print(f"[register] Registering {algo} (score={pm}) in MLflow Model Registry")
+    print("[register] ✓ Model artifact registered · version tagged as Staging candidate")
+def deploy_staging(**ctx):
+    ti   = ctx["ti"]
+    algo = ti.xcom_pull(task_ids="train",    key="algorithm")      or "?"
+    pm   = ti.xcom_pull(task_ids="evaluate", key="primary_metric") or 0
+    print(f"[deploy_staging] Promoting {algo} (score={pm}) to Staging")
+    print("[deploy_staging] ✓ Model transitioned to Staging · REST endpoint ready")
+# ── DAG wiring ────────────────────────────────────────────────────────────────
+with DAG(
+    dag_id       = "training_pipeline",
+    default_args = _DEFAULT_ARGS,
+    description  = "End-to-end ML training: load → validate → preprocess → train → evaluate → register → deploy",
+    schedule     = None,                    # no schedule: runs only when triggered
+    start_date   = datetime(2024, 1, 1),
+    catchup      = False,
+    tags         = ["automlops", "training"],
+) as dag:
+    # One PythonOperator per stage; task_ids are the keys the callables use
+    # in their xcom_pull(task_ids=...) calls.
+    t_load     = PythonOperator(task_id="load_data",      python_callable=load_data)
+    t_validate = PythonOperator(task_id="validate",       python_callable=validate)
+    t_preproc  = PythonOperator(task_id="preprocess",     python_callable=preprocess)
+    t_feat     = PythonOperator(task_id="feat_eng",       python_callable=feat_eng)
+    t_train    = PythonOperator(task_id="train",          python_callable=train)
+    t_eval     = PythonOperator(task_id="evaluate",       python_callable=evaluate)
+    t_report   = PythonOperator(task_id="report",         python_callable=report)
+    t_register = PythonOperator(task_id="register",       python_callable=register)
+    t_deploy   = PythonOperator(task_id="deploy_staging", python_callable=deploy_staging)
+    # Linear chain up to evaluate ...
+    t_load >> t_validate >> t_preproc >> t_feat >> t_train >> t_eval
+    # ... then two branches fan out from evaluate: reporting, and
+    # register followed by the staging deployment.
+    t_eval >> t_report
+    t_eval >> t_register >> t_deploy

mlops/airflow_runner.py ADDED Viewed

	@@ -0,0 +1,225 @@

+"""
+Airflow execution bridge for AutoMLOps.
+Triggers a real Airflow DAG run, then watches Airflow's metadata DB for
+task-state changes and mirrors them into the same ``pipeline_executions``
+dict that the existing ``/api/pipeline/status/<exec_id>`` endpoint reads.
+The frontend never needs to know Airflow is running — it polls the same
+Flask status endpoint it always did.
+"""
+from __future__ import annotations
+import uuid, time, threading, logging
+from datetime import datetime
+from pipelines.dag_engine import pipeline_executions, _lock
+logger = logging.getLogger(__name__)
+# Maps Airflow task states → the three states the frontend understands
+_AF_STATE: dict[str | None, str] = {
+    None:              "pending",
+    "queued":          "pending",
+    "scheduled":       "pending",
+    "deferred":        "pending",
+    "running":         "running",
+    "success":         "success",
+    "skipped":         "success",
+    "failed":          "failed",
+    "upstream_failed": "failed",
+    "removed":         "failed",
+}
+def _fe_state(af: str | None) -> str:
+    return _AF_STATE.get(af, "pending")
+# ── watcher thread ────────────────────────────────────────────────────────────
+def _watch(exec_id: str, dag_id: str, run_id: str, task_ids: list[str], task_names: dict[str, str]):
+    """
+    Polls the Airflow metadata DB and pushes updates into pipeline_executions.
+    Exits when the DAG run reaches a terminal state (success / failed).
+
+    Also exits when the ``exec_id`` entry has disappeared from
+    ``pipeline_executions``, when Airflow cannot be imported, or after 600
+    polls without a terminal state (the entry is then marked as failed).
+
+    Args:
+        exec_id: key of the entry in ``pipeline_executions`` to update.
+        dag_id: Airflow DAG id of the run being watched.
+        run_id: Airflow run id of the run being watched.
+        task_ids: task ids to mirror; progress is computed over this list.
+        task_names: display name per task id, used in log lines (falls back
+            to the task id).
+    """
+    try:
+        from airflow.models import DagRun, TaskInstance
+        from airflow.utils.session import create_session
+    except ImportError:
+        logger.error("Airflow is not installed — watcher thread cannot run")
+        with _lock:
+            if exec_id in pipeline_executions:
+                pipeline_executions[exec_id]["status"] = "failed"
+                pipeline_executions[exec_id]["error"]  = "Airflow not installed"
+        return
+    # Last frontend state mirrored per task, so each transition is logged once.
+    seen_states: dict[str, str] = {tid: "pending" for tid in task_ids}
+    for _attempt in range(600):   # 600 polls × 1.5 s sleep ≈ 15 min before timing out
+        time.sleep(1.5)
+        try:
+            with create_session() as session:
+                dag_run = session.query(DagRun).filter(
+                    DagRun.dag_id == dag_id,
+                    DagRun.run_id == run_id,
+                ).first()
+                if dag_run is None:
+                    continue          # scheduler hasn't picked it up yet
+                tis = {
+                    ti.task_id: ti
+                    for ti in session.query(TaskInstance).filter(
+                        TaskInstance.dag_id == dag_id,
+                        TaskInstance.run_id == run_id,
+                    ).all()
+                }
+            now       = datetime.utcnow().strftime("%H:%M:%S")
+            done_cnt  = 0
+            with _lock:
+                exec_st = pipeline_executions.get(exec_id)
+                if exec_st is None:
+                    return
+                for tid in task_ids:
+                    ti    = tis.get(tid)
+                    af_st = ti.state if ti else None
+                    fe_st = _fe_state(af_st)
+                    prev  = seen_states[tid]
+                    if fe_st == prev:
+                        # Unchanged since the last poll: nothing to log, but
+                        # finished tasks still count towards progress.
+                        if fe_st in ("success", "failed"):
+                            done_cnt += 1
+                        continue
+                    seen_states[tid] = fe_st
+                    name = task_names.get(tid, tid)
+                    # NOTE(review): a transition back to "pending" updates
+                    # seen_states only; task_states keeps its previous value.
+                    if fe_st == "running":
+                        exec_st["task_states"][tid]["status"]     = "running"
+                        exec_st["task_states"][tid]["started_at"] = (
+                            ti.start_date.isoformat() if ti and ti.start_date else None
+                        )
+                        exec_st["logs"].append(f"[{now}] ▶  {name}")
+                    elif fe_st == "success":
+                        dur = round(ti.duration, 1) if ti and ti.duration else 0
+                        exec_st["task_states"][tid]["status"]      = "success"
+                        exec_st["task_states"][tid]["result"]      = f"Completed in {dur}s"
+                        exec_st["task_states"][tid]["finished_at"] = (
+                            ti.end_date.isoformat() if ti and ti.end_date else None
+                        )
+                        exec_st["logs"].append(f"[{now}] ✔  {name} — {dur}s")
+                        done_cnt += 1
+                    elif fe_st == "failed":
+                        exec_st["task_states"][tid]["status"]      = "failed"
+                        exec_st["task_states"][tid]["error"]       = "Task failed in Airflow"
+                        exec_st["task_states"][tid]["finished_at"] = (
+                            ti.end_date.isoformat() if ti and ti.end_date else None
+                        )
+                        exec_st["logs"].append(f"[{now}] ✖  {name} — failed")
+                        done_cnt += 1
+                # ``or 1`` avoids dividing by zero when no task ids were given.
+                total = len(task_ids) or 1
+                exec_st["progress"] = int(100 * done_cnt / total)
+                exec_st["status"]   = "running"
+            # Check terminal state of the whole DAG run
+            dag_state = str(dag_run.state) if dag_run else "running"
+            if dag_state == "success":
+                with _lock:
+                    if exec_id in pipeline_executions:
+                        pipeline_executions[exec_id]["status"]       = "completed"
+                        pipeline_executions[exec_id]["progress"]     = 100
+                        pipeline_executions[exec_id]["completed_at"] = datetime.utcnow().isoformat()
+                        pipeline_executions[exec_id]["logs"].append(
+                            f"[{now}] ✔  DAG '{dag_id}' completed successfully"
+                        )
+                return
+            elif dag_state in ("failed", "upstream_failed"):
+                with _lock:
+                    if exec_id in pipeline_executions:
+                        pipeline_executions[exec_id]["status"] = "failed"
+                        pipeline_executions[exec_id]["error"]  = "DAG run failed in Airflow"
+                        pipeline_executions[exec_id]["logs"].append(
+                            f"[{now}] ✖  DAG '{dag_id}' failed"
+                        )
+                return
+        except Exception as exc:
+            # Best effort: a failed poll is logged and retried on the next
+            # iteration rather than aborting the watcher.
+            logger.warning(f"[watcher] poll error: {exc}")
+    # Timed out
+    with _lock:
+        if exec_id in pipeline_executions:
+            pipeline_executions[exec_id]["status"] = "failed"
+            pipeline_executions[exec_id]["error"]  = "Execution watcher timed out"
+# ── public API ────────────────────────────────────────────────────────────────
+def trigger_pipeline(pipeline_id: str, context: dict | None = None, dag=None) -> str:
+    """
+    Trigger an Airflow DAG run and return an exec_id compatible with the
+    existing pipeline_executions / status endpoint contract.
+    ``dag`` is the DAG object from pipeline_defs.py (used for task metadata).
+    """
+    from airflow.api.common.trigger_dag import trigger_dag as af_trigger
+    ts      = datetime.utcnow().strftime("%Y%m%dT%H%M%S")
+    run_id  = f"automlops__{ts}"
+    exec_id = str(uuid.uuid4())[:8]
+    dag_id = pipeline_id   # our pipeline IDs match Airflow DAG IDs exactly
+    # Fire the Airflow DAG run
+    af_trigger(dag_id=dag_id, run_id=run_id, conf=context or {}, replace_microseconds=False)
+    # Collect task metadata from the pipeline_defs DAG object
+    task_ids   = list(dag.tasks.keys())   if dag else []
+    task_names = {tid: dag.tasks[tid].name for tid in task_ids} if dag else {}
+    # Initialise exec state (same schema as dag_engine.execute_dag)
+    task_states = {
+        tid: {"status": "pending", "started_at": None,
+              "finished_at": None, "result": None, "error": None}
+        for tid in task_ids
+    }
+    now = datetime.utcnow().strftime("%H:%M:%S")
+    with _lock:
+        pipeline_executions[exec_id] = {
+            "exec_id":     exec_id,
+            "dag_id":      dag_id,
+            "run_id":      run_id,
+            "dag_name":    dag.name if dag else dag_id,
+            "status":      "queued",
+            "progress":    0,
+            "task_states": task_states,
+            "logs": [f"[{now}] DAG '{dag_id}' triggered in Apache Airflow  (run_id={run_id})"],
+            "created_at":  datetime.utcnow().isoformat(),
+        }
+    # Start the watcher thread
+    threading.Thread(
+        target=_watch,
+        args=(exec_id, dag_id, run_id, task_ids, task_names),
+        daemon=True,
+    ).start()
+    return exec_id
+def is_available() -> bool:
+    """Return True if Airflow is installed and the scheduler DB is reachable."""
+    try:
+        from airflow.utils.session import create_session
+        with create_session():
+            pass
+        return True
+    except Exception:
+        return False

mlops/trainer.py CHANGED Viewed

@@ -1,10 +1,14 @@
 """Background model trainer with MLflow tracking."""
 import time
 import uuid
 import threading
 import numpy as np
 from datetime import datetime
 import mlflow
 import mlflow.sklearn
 from sklearn.preprocessing import StandardScaler, LabelEncoder
@@ -26,7 +30,7 @@ _lock = threading.Lock()
 # ── Internal helpers ──────────────────────────────────────────────────────────
 def _get_or_create_experiment(name: str) -> str:
-    mlflow.set_tracking_uri("sqlite:///mlflow.db")
     exp = mlflow.get_experiment_by_name(name)
     if exp is None:
         return mlflow.create_experiment(name)
@@ -65,7 +69,7 @@ def _do_train(job_id: str, dataset_name: str, algorithm_name: str,
     start_time = time.time()
     try:
         _update_job(training_jobs, job_id, status="running", progress=5)
-        mlflow.set_tracking_uri("sqlite:///mlflow.db")
         # 1. Load data
         X_train, X_test, y_train, y_test, meta = load_dataset(dataset_name)
@@ -176,7 +180,7 @@ def _do_automl(job_id: str, dataset_name: str, task_type: str,
     """Run every algorithm for the chosen task and log the best."""
     try:
         _update_job(automl_jobs, job_id, status="running", progress=2)
-        mlflow.set_tracking_uri("sqlite:///mlflow.db")
         X_train, X_test, y_train, y_test, meta = load_dataset(dataset_name)
         _update_job(automl_jobs, job_id, dataset_meta=meta, progress=5)
@@ -265,6 +269,50 @@ def _do_automl(job_id: str, dataset_name: str, task_type: str,
         _update_job(automl_jobs, job_id, status="failed", error=str(exc))
 def start_automl(dataset_name: str, task_type: str,
                  optimize_metric: str = "accuracy",
                  max_runs: int = 20) -> str:

 """Background model trainer with MLflow tracking."""
+import os
 import time
 import uuid
 import threading
 import numpy as np
 from datetime import datetime
+# Allow override via env var so Airflow tasks (different CWD) hit the same DB
+_MLFLOW_URI = os.environ.get("MLFLOW_TRACKING_URI", "sqlite:///mlflow.db")
 import mlflow
 import mlflow.sklearn
 from sklearn.preprocessing import StandardScaler, LabelEncoder
 # ── Internal helpers ──────────────────────────────────────────────────────────
 def _get_or_create_experiment(name: str) -> str:
+    mlflow.set_tracking_uri(_MLFLOW_URI)
     exp = mlflow.get_experiment_by_name(name)
     if exp is None:
         return mlflow.create_experiment(name)
     start_time = time.time()
     try:
         _update_job(training_jobs, job_id, status="running", progress=5)
+        mlflow.set_tracking_uri(_MLFLOW_URI)
         # 1. Load data
         X_train, X_test, y_train, y_test, meta = load_dataset(dataset_name)
     """Run every algorithm for the chosen task and log the best."""
     try:
         _update_job(automl_jobs, job_id, status="running", progress=2)
+        mlflow.set_tracking_uri(_MLFLOW_URI)
         X_train, X_test, y_train, y_test, meta = load_dataset(dataset_name)
         _update_job(automl_jobs, job_id, dataset_meta=meta, progress=5)
         _update_job(automl_jobs, job_id, status="failed", error=str(exc))
+def train_for_pipeline(dataset_name: str, task_type: str, category: str,
+                       algorithm: str, experiment_name: str = "pipeline") -> dict:
+    """
+    Synchronous training helper used by Airflow pipeline tasks.
+    Runs the full train/eval loop and returns a metrics dict.
+
+    Args:
+        dataset_name: Name passed to ``load_dataset``.
+        task_type: ``"classification"`` selects ``_classification_metrics``;
+            any other value selects ``_regression_metrics``.
+        category: Algorithm category passed to ``get_algorithm``.
+        algorithm: Algorithm name passed to ``get_algorithm``; also used in
+            the MLflow run name, tags and params.
+        experiment_name: MLflow experiment to log under (created if missing
+            via ``_get_or_create_experiment``).
+
+    Returns:
+        The metrics dict that was logged to MLflow.
+
+    Raises:
+        Nothing is caught or wrapped here: errors from data loading, scaling,
+        fitting or MLflow logging propagate as raised by those calls.
+        NOTE(review): callers expecting a ``RuntimeError`` specifically should
+        be checked -- this function does not convert exceptions to one.
+    """
+    from sklearn.preprocessing import StandardScaler, MinMaxScaler
+    mlflow.set_tracking_uri(_MLFLOW_URI)
+    # The fifth value returned by load_dataset is not needed here.
+    X_train, X_test, y_train, y_test, _ = load_dataset(dataset_name)
+    algo_cfg = get_algorithm(task_type, category, algorithm)
+    params   = algo_cfg["params"]
+    # Scaler is chosen from the algorithm *name*; presumably the Naive Bayes
+    # variants need non-negative features -- TODO confirm.
+    if "Naive Bayes" in algorithm or "Complement" in algorithm:
+        scaler = MinMaxScaler()
+    else:
+        scaler = StandardScaler()
+    # Fit the scaler on the training split only, then reuse it for the test split.
+    X_tr = scaler.fit_transform(X_train)
+    X_te = scaler.transform(X_test)
+    exp_id = _get_or_create_experiment(experiment_name)
+    with mlflow.start_run(experiment_id=exp_id,
+                          run_name=f"{algorithm} — {dataset_name}") as run:
+        mlflow.set_tags({
+            "algorithm": algorithm, "category": category,
+            "dataset": dataset_name, "source": "airflow_pipeline",
+        })
+        mlflow.log_params({"algorithm": algorithm, "category": category,
+                           "dataset": dataset_name})
+        model = algo_cfg["class"](**params)
+        model.fit(X_tr, y_train)
+        y_pred = model.predict(X_te)
+        if task_type == "classification":
+            metrics = _classification_metrics(y_test, y_pred)
+        else:
+            metrics = _regression_metrics(y_test, y_pred)
+        mlflow.log_metrics(metrics)
+        # NOTE(review): only the estimator is logged; the fitted scaler is not,
+        # so consumers of this artifact must scale inputs themselves.
+        mlflow.sklearn.log_model(model, "model")
+    return metrics
 def start_automl(dataset_name: str, task_type: str,
                  optimize_metric: str = "accuracy",
                  max_runs: int = 20) -> str:

start.sh ADDED Viewed

	@@ -0,0 +1,24 @@

+#!/bin/bash
+# AutoMLOps startup — launches Airflow scheduler then the Flask app
+set -e
+echo "===== AutoMLOps Startup at $(date -u '+%Y-%m-%d %H:%M:%S') ====="
+# ── Airflow scheduler ─────────────────────────────────────────────────────────
+echo "[startup] Starting Apache Airflow scheduler..."
+airflow scheduler &
+SCHEDULER_PID=$!
+echo "[startup] Scheduler PID: ${SCHEDULER_PID}"
+# Brief pause so the scheduler can parse DAGs before first web request
+sleep 4
+# ── Flask application ─────────────────────────────────────────────────────────
+echo "[startup] Starting Flask application on :7860..."
+exec gunicorn app:app \
+    --bind 0.0.0.0:7860 \
+    --workers 1 \
+    --threads 4 \
+    --worker-class gthread \
+    --timeout 300 \
+    --log-level info

templates/base.html CHANGED Viewed

@@ -52,7 +52,7 @@
     <div class="nav-section-label">Operations</div>
     <a href="/pipeline" class="nav-item {% if active_page == 'pipeline' %}active{% endif %}">
-      <span class="nav-icon"><i class="fa-solid fa-diagram-project"></i></span> Pipelines
     </a>
     <a href="/models" class="nav-item {% if active_page == 'models' %}active{% endif %}">
       <span class="nav-icon"><i class="fa-solid fa-box-archive"></i></span> Model Registry

     <div class="nav-section-label">Operations</div>
     <a href="/pipeline" class="nav-item {% if active_page == 'pipeline' %}active{% endif %}">
+      <span class="nav-icon"><i class="fa-solid fa-diagram-project"></i></span> Pipeline Studio
     </a>
     <a href="/models" class="nav-item {% if active_page == 'models' %}active{% endif %}">
       <span class="nav-icon"><i class="fa-solid fa-box-archive"></i></span> Model Registry

templates/pipeline.html CHANGED Viewed

@@ -1,295 +1,701 @@
 {% extends "base.html" %}
 {% set active_page = "pipeline" %}
-{% block title %}Pipelines{% endblock %}
-{% block page_title %}<i class="fa-solid fa-diagram-project" style="color:var(--cyan)"></i> Pipelines{% endblock %}
 {% block content %}
-<div class="page-title">Pipeline Orchestration</div>
-<div class="page-sub">Airflow-style DAG visualisation and execution — click any pipeline to inspect and run</div>
-<!-- Pipeline selector tabs -->
-<div class="tab-bar" id="pipeline-tabs">
-  <button class="tab-btn active" onclick="switchPipeline('training_pipeline', this)">
-    <i class="fa-solid fa-brain"></i> Training Pipeline
-  </button>
-  <button class="tab-btn" onclick="switchPipeline('retraining_pipeline', this)">
-    <i class="fa-solid fa-rotate"></i> Retraining Pipeline
-  </button>
-  <button class="tab-btn" onclick="switchPipeline('data_pipeline', this)">
-    <i class="fa-solid fa-database"></i> Data Pipeline
-  </button>
-</div>
-<!-- Pipeline description + run button -->
-<div class="card mb-20" style="margin-bottom:16px">
-  <div class="flex-between">
-    <div>
-      <div class="card-title" id="pipeline-name" style="font-size:1rem;margin-bottom:4px">Training Pipeline</div>
-      <div id="pipeline-desc" style="font-size:.85rem;color:var(--text-secondary)">
-        End-to-end model training: ingest → preprocess → train → evaluate → register
-      </div>
-    </div>
-    <div class="flex-gap">
-      <!-- Context form for training pipeline -->
-      <div id="ctx-form" style="display:flex;gap:8px;flex-wrap:wrap">
-        <select class="form-select" id="ctx-dataset" style="width:auto;padding:6px 28px 6px 10px;font-size:.82rem">
-          {% for name in datasets %}<option>{{ name }}</option>{% endfor %}
-        </select>
-      </div>
-      <button class="btn btn-primary" id="btn-run-pipeline" onclick="runPipeline()">
-        <i class="fa-solid fa-play"></i> Execute DAG
       </button>
     </div>
-  </div>
-</div>
-<!-- DAG canvas -->
-<div class="card mb-20" style="margin-bottom:16px">
-  <div class="card-header">
-    <div class="card-title"><i class="fa-solid fa-sitemap" style="color:var(--accent)"></i> DAG Graph</div>
-    <span id="exec-status-badge"></span>
   </div>
-  <div id="dag-canvas" class="dag-canvas" style="height:320px"></div>
-</div>
-<!-- Execution state grid + log -->
-<div class="grid-2">
-  <div class="card">
-    <div class="card-header">
-      <div class="card-title"><i class="fa-solid fa-list-check" style="color:var(--success)"></i> Task Status</div>
-      <div id="exec-progress-wrap" style="display:flex;align-items:center;gap:8px;font-size:.82rem;color:var(--text-muted)">
-        <span id="exec-pct">—</span>
       </div>
     </div>
-    <div id="task-list" style="display:flex;flex-direction:column;gap:6px"></div>
   </div>
-  <div class="card">
-    <div class="card-header">
-      <div class="card-title"><i class="fa-solid fa-terminal" style="color:var(--warning)"></i> Execution Log</div>
-      <button class="btn btn-ghost btn-sm" onclick="clearLog()"><i class="fa-solid fa-trash"></i></button>
     </div>
-    <div class="pipeline-log" id="exec-log">Waiting for execution…</div>
   </div>
 </div>
 {% endblock %}
 {% block scripts %}
 <script>
-const DAGS = {{ dags | safe }};
-let currentPipeline = 'training_pipeline';
-let currentExecId   = null;
-let pollIv          = null;
-let currentDag      = null;
-const STATUS_COLORS = {
-  pending: '#30363d', running: '#f59e0b', success: '#22c55e', failed: '#ef4444',
-};
-const STATUS_ICONS = {
-  pending: '⏳', running: '⚡', success: '✅', failed: '❌',
 };
-// ── Init ─────────────────────────────────────────────────────────────────────
-document.addEventListener('DOMContentLoaded', () => {
-  switchPipeline('training_pipeline',
-    document.querySelector('.tab-btn.active'));
-});
 function switchPipeline(id, btn) {
-  currentPipeline = id;
-  currentExecId   = null;
   if (pollIv) { clearInterval(pollIv); pollIv = null; }
-  document.querySelectorAll('.tab-btn').forEach(b => b.classList.remove('active'));
   btn.classList.add('active');
-  const dag = DAGS[id];
-  currentDag = dag;
-  document.getElementById('pipeline-name').textContent = dag.name;
-  document.getElementById('pipeline-desc').textContent = dag.description;
-  // Show dataset selector only for training pipeline
-  document.getElementById('ctx-form').style.display =
-    id === 'training_pipeline' ? 'flex' : 'none';
-  renderDAG(dag);
-  renderTaskList(dag, {});
-  document.getElementById('exec-log').textContent = 'Waiting for execution…';
-  document.getElementById('exec-status-badge').innerHTML = '';
-  document.getElementById('exec-pct').textContent = '—';
-  document.getElementById('btn-run-pipeline').disabled = false;
-  document.getElementById('btn-run-pipeline').innerHTML = '<i class="fa-solid fa-play"></i> Execute DAG';
-}
-// ── DAG rendering with Plotly ─────────────────────────────────────────────────
-function renderDAG(dag, taskStates) {
-  taskStates = taskStates || {};
-  const tasks   = Object.values(dag.tasks);
-  const layers  = {};
-  tasks.forEach(t => { layers[t.layer] = (layers[t.layer] || []); layers[t.layer].push(t); });
-  const nodeX = {}, nodeY = {};
-  const maxLayer = Math.max(...tasks.map(t => t.layer));
-  const xStep = 1 / (maxLayer + 1);
-  Object.entries(layers).forEach(([layer, ts]) => {
-    const xPos = (parseInt(layer) + 0.5) * xStep;
-    const yStep = 1 / (ts.length + 1);
-    ts.forEach((t, i) => {
-      nodeX[t.task_id] = xPos;
-      nodeY[t.task_id] = (i + 1) * yStep;
-    });
   });
-  // Build edge traces
-  const edgeTraces = [];
   tasks.forEach(t => {
-    t.upstream.forEach(upId => {
-      if (!nodeX[upId]) return;
-      edgeTraces.push({
-        type: 'scatter', mode: 'lines',
-        x: [nodeX[upId], nodeX[t.task_id]],
-        y: [nodeY[upId], nodeY[t.task_id]],
-        line: { color: '#30363d', width: 2 },
-        hoverinfo: 'none', showlegend: false,
-      });
-    });
   });
-  // Node trace
-  const nodeColors = tasks.map(t => {
-    const st = (taskStates[t.task_id] || {}).status || 'pending';
-    return STATUS_COLORS[st] || '#30363d';
-  });
-  const nodeText = tasks.map(t => {
-    const st = (taskStates[t.task_id] || {}).status || 'pending';
-    return `${t.icon} ${t.name}<br><span style="font-size:10px">${STATUS_ICONS[st]} ${st}</span>`;
-  });
-  const nodeHover = tasks.map(t => {
-    const st = (taskStates[t.task_id] || {}).status || 'pending';
-    return `<b>${t.name}</b><br>${t.description}<br>Status: ${st}`;
   });
-  const nodeTrace = {
-    type: 'scatter', mode: 'markers+text',
-    x: tasks.map(t => nodeX[t.task_id]),
-    y: tasks.map(t => nodeY[t.task_id]),
-    text: nodeText,
-    textposition: 'bottom center',
-    textfont: { color: '#e6edf3', size: 11 },
-    marker: {
-      size: 36,
-      color: nodeColors,
-      line: { color: '#e6edf3', width: 1.5 },
-      symbol: 'circle',
-    },
-    hovertemplate: nodeHover.map(h => h + '<extra></extra>'),
-    showlegend: false,
-  };
-  const bg = '#0d1117';
-  Plotly.react('dag-canvas', [...edgeTraces, nodeTrace], {
-    paper_bgcolor: bg, plot_bgcolor: bg,
-    margin: { t: 20, b: 40, l: 20, r: 20 },
-    xaxis: { showgrid: false, zeroline: false, showticklabels: false, range: [0,1] },
-    yaxis: { showgrid: false, zeroline: false, showticklabels: false, range: [0,1] },
-    dragmode: false,
-  }, { responsive: true, displayModeBar: false });
-}
-// ── Task status list ──────────────────────────────────────────────────────────
-function renderTaskList(dag, taskStates) {
-  const tasks = Object.values(dag.tasks).sort((a,b) => a.layer - b.layer);
-  const el = document.getElementById('task-list');
-  el.innerHTML = tasks.map(t => {
-    const st  = (taskStates[t.task_id] || {}).status || 'pending';
-    const res = (taskStates[t.task_id] || {}).result || '';
-    const clr = STATUS_COLORS[st] || '#30363d';
-    return `<div style="display:flex;align-items:flex-start;gap:10px;padding:8px 10px;border-radius:6px;background:var(--bg-tertiary)">
-      <div style="width:10px;height:10px;border-radius:50%;background:${clr};margin-top:4px;flex-shrink:0"></div>
-      <div style="flex:1;min-width:0">
-        <div style="font-size:.85rem;font-weight:500">${t.icon} ${t.name}</div>
-        ${res ? `<div style="font-size:.75rem;color:var(--text-muted);margin-top:2px;overflow:hidden;text-overflow:ellipsis;white-space:nowrap" title="${res}">${res}</div>` : ''}
       </div>
-      <span style="font-size:.72rem;padding:2px 7px;border-radius:10px;background:${clr}22;color:${clr};white-space:nowrap">${STATUS_ICONS[st]} ${st}</span>
-    </div>`;
-  }).join('');
 }
 // ── Execute pipeline ──────────────────────────────────────────────────────────
 async function runPipeline() {
-  document.getElementById('btn-run-pipeline').disabled = true;
-  document.getElementById('btn-run-pipeline').innerHTML = '<span class="spinner"></span> Running…';
-  document.getElementById('exec-log').textContent = '';
-  document.getElementById('exec-status-badge').innerHTML =
-    '<span class="badge badge-warning"><span class="spinner" style="width:9px;height:9px;border-width:1.5px"></span> Running</span>';
   const ctx = {};
-  if (currentPipeline === 'training_pipeline') {
-    ctx.dataset = document.getElementById('ctx-dataset').value;
   }
   try {
-    const res  = await fetch(`/api/pipeline/${currentPipeline}/execute`, {
-      method: 'POST', headers:{'Content-Type':'application/json'},
       body: JSON.stringify(ctx),
     });
-    const data = await res.json();
-    currentExecId = data.exec_id;
-    pollExecution();
-  } catch(e) {
-    showToast('Failed to start pipeline', 'error');
-    document.getElementById('btn-run-pipeline').disabled = false;
-    document.getElementById('btn-run-pipeline').innerHTML = '<i class="fa-solid fa-play"></i> Execute DAG';
-  }
 }
-function pollExecution() {
   if (pollIv) clearInterval(pollIv);
   pollIv = setInterval(async () => {
-    const res  = await fetch(`/api/pipeline/status/${currentExecId}`);
-    const exec = await res.json();
-    // Update progress
-    document.getElementById('exec-pct').textContent = exec.progress + '%';
-    // Update log
-    const logEl = document.getElementById('exec-log');
-    logEl.innerHTML = (exec.logs || []).map(line => {
-      let cls = '';
-      if (line.includes('✔')) cls = 'log-line-ok';
-      else if (line.includes('✖')) cls = 'log-line-err';
-      else if (line.includes('▶')) cls = 'log-line-info';
-      return `<div class="${cls}">${line}</div>`;
-    }).join('');
-    logEl.scrollTop = logEl.scrollHeight;
-    // Update DAG
-    if (exec.task_states) {
-      renderDAG(currentDag, exec.task_states);
-      renderTaskList(currentDag, exec.task_states);
-    }
-    if (exec.status === 'completed') {
-      clearInterval(pollIv); pollIv = null;
-      document.getElementById('exec-status-badge').innerHTML =
-        '<span class="badge badge-success"><i class="fa-solid fa-check"></i> Completed</span>';
-      document.getElementById('btn-run-pipeline').disabled = false;
-      document.getElementById('btn-run-pipeline').innerHTML = '<i class="fa-solid fa-rotate-right"></i> Run Again';
-      showToast(`Pipeline "${currentDag.name}" completed`, 'success');
-    } else if (exec.status === 'failed') {
-      clearInterval(pollIv); pollIv = null;
-      document.getElementById('exec-status-badge').innerHTML =
-        '<span class="badge badge-danger"><i class="fa-solid fa-xmark"></i> Failed</span>';
-      document.getElementById('btn-run-pipeline').disabled = false;
-      document.getElementById('btn-run-pipeline').innerHTML = '<i class="fa-solid fa-play"></i> Retry';
-      showToast('Pipeline failed: ' + (exec.error || 'unknown'), 'error');
-    }
-  }, 800);
-}
-function clearLog() { document.getElementById('exec-log').textContent = 'Cleared.'; }
 </script>
 {% endblock %}

 {% extends "base.html" %}
 {% set active_page = "pipeline" %}
+{% block title %}Pipeline Studio{% endblock %}
+{% block page_title %}<i class="fa-solid fa-diagram-project" style="color:var(--cyan)"></i> Pipeline Studio{% endblock %}
+{% block head_extra %}
+<style>
+/* ── Override page padding so studio fills the viewport ─────────────────── */
+.page-content { padding: 0 !important; overflow: hidden; height: calc(100vh - var(--navbar-h)); }
+.main { overflow: hidden; }
+/* ── Studio shell ─────────────────────────────────────────────────────────── */
+.ps { display: flex; flex-direction: column; height: 100%; overflow: hidden; }
+/* ── Toolbar ─────────────────────────────────────────────────────────────── */
+.ps-toolbar {
+  display: flex; align-items: center; gap: 10px; flex-wrap: wrap;
+  padding: 0 16px; min-height: 52px; flex-shrink: 0;
+  background: var(--bg-secondary);
+  border-bottom: 1px solid var(--border-color);
+}
+.ps-tabs { display: flex; gap: 3px; }
+.ps-tab {
+  display: flex; align-items: center; gap: 6px;
+  padding: 5px 13px; border-radius: 6px;
+  font-size: .8rem; font-weight: 500;
+  background: transparent; border: 1px solid transparent;
+  color: var(--text-secondary); cursor: pointer;
+  transition: background .13s, color .13s, border-color .13s;
+}
+.ps-tab:hover  { background: var(--bg-tertiary); color: var(--text-primary); }
+.ps-tab.active { background: rgba(139,92,246,.12); border-color: rgba(139,92,246,.3); color: var(--accent-light); }
+.ps-info { flex: 1; min-width: 0; padding: 0 12px; }
+.ps-name { font-size: .88rem; font-weight: 600; white-space: nowrap; overflow: hidden; text-overflow: ellipsis; }
+.ps-desc { font-size: .74rem; color: var(--text-secondary); white-space: nowrap; overflow: hidden; text-overflow: ellipsis; margin-top: 1px; }
+.ps-badge {
+  display: inline-flex; align-items: center; gap: 5px; flex-shrink: 0;
+  padding: 3px 10px; border-radius: 20px; font-size: .72rem; font-weight: 600;
+}
+.ps-badge.idle    { background: var(--bg-tertiary); color: var(--text-muted); }
+.ps-badge.running { background: rgba(245,158,11,.12); color: var(--warning); }
+.ps-badge.success { background: rgba(34,197,94,.12); color: var(--success); }
+.ps-badge.failed  { background: rgba(239,68,68,.12); color: var(--danger); }
+.ps-run-btn {
+  display: flex; align-items: center; gap: 7px; flex-shrink: 0;
+  padding: 6px 16px; border: none; border-radius: 6px;
+  background: linear-gradient(135deg, var(--accent) 0%, var(--accent-blue) 100%);
+  color: #fff; font-size: .83rem; font-weight: 600;
+  cursor: pointer; transition: opacity .15s, transform .1s;
+}
+.ps-run-btn:hover:not(:disabled) { opacity: .88; }
+.ps-run-btn:active:not(:disabled) { transform: scale(.96); }
+.ps-run-btn:disabled { opacity: .45; cursor: default; }
+/* ── Main area (canvas + config panel) ───────────────────────────────────── */
+.ps-main { flex: 1; display: flex; overflow: hidden; }
+/* DAG canvas */
+.ps-canvas {
+  flex: 1; overflow: auto; position: relative;
+  background-color: var(--bg-primary);
+  background-image: radial-gradient(circle, var(--border-color) 1px, transparent 1px);
+  background-size: 28px 28px;
+}
+.ps-canvas-inner { position: relative; }
+.dag-arrows { position: absolute; top: 0; left: 0; pointer-events: none; z-index: 5; overflow: visible; }
+/* ── DAG nodes ────────────────────────────────────────────────────────────── */
+.dag-node {
+  position: absolute;
+  background: var(--bg-secondary);
+  border: 1.5px solid var(--border-color);
+  border-radius: 10px;
+  padding: 10px 11px 8px;
+  cursor: pointer;
+  transition: border-color .18s, box-shadow .18s, transform .12s;
+  user-select: none; z-index: 10;
+}
+.dag-node:hover {
+  border-color: var(--accent-light);
+  box-shadow: 0 0 0 3px rgba(139,92,246,.15), 0 4px 14px rgba(0,0,0,.3);
+  transform: translateY(-1px);
+}
+.dag-node.selected { border-color: var(--accent); box-shadow: 0 0 0 3px rgba(139,92,246,.25); }
+.dag-node.s-running { border-color: var(--warning); animation: node-pulse 1.6s ease-in-out infinite; }
+.dag-node.s-success { border-color: var(--success); box-shadow: 0 0 0 2px rgba(34,197,94,.2); }
+.dag-node.s-failed  { border-color: var(--danger);  box-shadow: 0 0 0 2px rgba(239,68,68,.2); }
+@keyframes node-pulse {
+  0%, 100% { box-shadow: 0 0 0 2px rgba(245,158,11,.2); }
+  50%       { box-shadow: 0 0 0 8px rgba(245,158,11,.04); }
+}
+/* Purple dot = configurable */
+.dag-node.configurable::after {
+  content: ''; position: absolute; top: 7px; right: 7px;
+  width: 5px; height: 5px; border-radius: 50%; background: var(--accent);
+}
+.nd-icon  { font-size: 1.1rem; display: block; line-height: 1; margin-bottom: 3px; }
+.nd-name  { font-size: .77rem; font-weight: 600; color: var(--text-primary); white-space: nowrap; overflow: hidden; text-overflow: ellipsis; }
+.nd-badge {
+  display: inline-flex; align-items: center; gap: 4px;
+  margin-top: 5px; padding: 2px 6px; border-radius: 8px;
+  font-size: .66rem; font-weight: 500;
+}
+.nd-badge.pending { background: rgba(101,109,118,.15); color: var(--text-muted); }
+.nd-badge.running { background: rgba(245,158,11,.14); color: var(--warning); }
+.nd-badge.success { background: rgba(34,197,94,.12); color: var(--success); }
+.nd-badge.failed  { background: rgba(239,68,68,.12); color: var(--danger); }
+.nd-result { font-size: .65rem; color: var(--text-muted); margin-top: 3px; white-space: nowrap; overflow: hidden; text-overflow: ellipsis; }
+.sdot { width: 5px; height: 5px; border-radius: 50%; display: inline-block; flex-shrink: 0; }
+.sdot.pending { background: var(--text-muted); }
+.sdot.running { background: var(--warning); animation: blink 1s step-start infinite; }
+.sdot.success { background: var(--success); }
+.sdot.failed  { background: var(--danger); }
+@keyframes blink { 0%,100%{opacity:1} 50%{opacity:0} }
+/* ── Config panel ─────────────────────────────────────────────────────────── */
+.ps-cfg {
+  width: 0; overflow: hidden; flex-shrink: 0;
+  background: var(--bg-secondary);
+  border-left: 1px solid var(--border-color);
+  display: flex; flex-direction: column;
+  transition: width .24s cubic-bezier(.4,0,.2,1);
+}
+.ps-cfg.open { width: 296px; }
+.cfg-hdr {
+  display: flex; align-items: center; justify-content: space-between;
+  padding: 11px 13px; flex-shrink: 0;
+  border-bottom: 1px solid var(--border-color);
+  font-size: .8rem; font-weight: 600; color: var(--text-secondary);
+}
+.cfg-body { flex: 1; overflow-y: auto; padding: 14px; }
+.cfg-node-hdr {
+  display: flex; align-items: flex-start; gap: 10px;
+  padding-bottom: 13px; margin-bottom: 13px;
+  border-bottom: 1px solid var(--border-color);
+}
+.cfg-node-icon  { font-size: 1.5rem; flex-shrink: 0; line-height: 1; }
+.cfg-node-title { font-size: .9rem; font-weight: 600; line-height: 1.3; }
+.cfg-node-desc  { font-size: .76rem; color: var(--text-secondary); margin-top: 4px; line-height: 1.5; }
+.cfg-sec { margin-bottom: 16px; }
+.cfg-lbl {
+  display: block; margin-bottom: 6px;
+  font-size: .69rem; font-weight: 700; letter-spacing: .08em;
+  text-transform: uppercase; color: var(--text-muted);
+}
+.cfg-select {
+  width: 100%; background: var(--bg-tertiary); border: 1px solid var(--border-color);
+  color: var(--text-primary); border-radius: 6px; padding: 7px 28px 7px 10px;
+  font-size: .82rem; outline: none; cursor: pointer; appearance: none;
+  transition: border-color .15s;
+  background-image: url("data:image/svg+xml,%3Csvg xmlns='http://www.w3.org/2000/svg' width='12' height='8' viewBox='0 0 12 8'%3E%3Cpath d='M1 1l5 5 5-5' stroke='%23656d76' stroke-width='1.5' fill='none' stroke-linecap='round'/%3E%3C/svg%3E");
+  background-repeat: no-repeat; background-position: right 9px center;
+}
+.cfg-select:focus { border-color: var(--accent); }
+.cfg-row {
+  display: flex; justify-content: space-between; align-items: flex-start;
+  padding: 6px 0; border-bottom: 1px solid var(--border-color); font-size: .79rem;
+}
+.cfg-row:last-child { border-bottom: none; }
+.cfg-row-k { color: var(--text-muted); white-space: nowrap; padding-right: 8px; }
+.cfg-row-v { color: var(--text-primary); font-weight: 500; text-align: right; word-break: break-word; max-width: 62%; font-size: .77rem; }
+/* ── Terminal ─────────────────────────────────────────────────────────────── */
+.ps-term {
+  flex-shrink: 0; height: 34px; overflow: hidden;
+  background: #07090d;
+  border-top: 1px solid var(--border-color);
+  transition: height .22s cubic-bezier(.4,0,.2,1);
+}
+.ps-term.expanded { height: 188px; }
+.term-hdr {
+  display: flex; align-items: center; gap: 5px;
+  height: 34px; padding: 0 14px;
+  cursor: pointer; user-select: none;
+  border-bottom: 1px solid var(--border-color);
+  font-family: 'Fira Code', monospace; font-size: .72rem;
+  color: var(--text-secondary);
+}
+.term-hdr:hover { background: rgba(255,255,255,.02); }
+.term-body {
+  height: calc(100% - 34px); overflow-y: auto;
+  padding: 7px 14px;
+  font-family: 'Fira Code', monospace; font-size: .71rem;
+  color: #8b949e; line-height: 1.65;
+}
+.l-ok   { color: #22c55e; }
+.l-err  { color: #ef4444; }
+.l-info { color: #f59e0b; }
+.l-dim  { color: #3d4450; }
+</style>
+{% endblock %}
 {% block content %}
+<div class="ps">
+  <!-- ── Toolbar ─────────────────────────────────────────────────────────── -->
+  <div class="ps-toolbar">
+    <div class="ps-tabs">
+      <button class="ps-tab active" onclick="switchPipeline('training_pipeline',this)">
+        <i class="fa-solid fa-brain"></i> Training
+      </button>
+      <button class="ps-tab" onclick="switchPipeline('retraining_pipeline',this)">
+        <i class="fa-solid fa-rotate"></i> Retraining
+      </button>
+      <button class="ps-tab" onclick="switchPipeline('data_pipeline',this)">
+        <i class="fa-solid fa-database"></i> Data
       </button>
     </div>
+    <div class="ps-info">
+      <div class="ps-name" id="ps-name">—</div>
+      <div class="ps-desc" id="ps-desc">—</div>
+    </div>
+    <div class="ps-badge idle" id="ps-badge">
+      <span class="sdot pending" id="ps-dot"></span>
+      <span id="ps-badge-txt">Idle</span>
+    </div>
+    <button class="ps-run-btn" id="ps-run-btn" onclick="runPipeline()">
+      <i class="fa-solid fa-play" id="ps-btn-icon"></i>
+      <span id="ps-btn-txt">Execute DAG</span>
+    </button>
   </div>
+  <!-- ── Main area ──────────────────────────────────────────────────────── -->
+  <div class="ps-main">
+    <!-- DAG Canvas -->
+    <div class="ps-canvas" id="ps-canvas">
+      <div class="ps-canvas-inner" id="ps-ci">
+        <svg class="dag-arrows" id="dag-svg" width="1" height="1"></svg>
+        <!-- nodes injected by JS -->
       </div>
     </div>
+    <!-- Config panel (slides in) -->
+    <div class="ps-cfg" id="ps-cfg">
+      <div class="cfg-hdr">
+        <span><i class="fa-solid fa-sliders" style="color:var(--accent);margin-right:6px"></i>Node Config</span>
+        <button class="btn btn-ghost btn-sm" onclick="closeConfig()" title="Close">
+          <i class="fa-solid fa-xmark"></i>
+        </button>
+      </div>
+      <div class="cfg-body" id="cfg-body">
+        <div style="text-align:center;padding:36px 0 28px;color:var(--text-muted);font-size:.82rem">
+          <i class="fa-solid fa-arrow-pointer" style="font-size:1.5rem;opacity:.3;display:block;margin-bottom:10px"></i>
+          Click any node to configure it
+        </div>
+      </div>
+    </div>
   </div>
+  <!-- ── Execution terminal ─────────────────────────────────────────────── -->
+  <div class="ps-term" id="ps-term">
+    <div class="term-hdr" onclick="toggleTerm()">
+      <span style="color:#ff5f56;font-size:.5rem">●</span>
+      <span style="color:#ffbd2e;font-size:.5rem">●</span>
+      <span style="color:#27c93f;font-size:.5rem">●</span>
+      <span style="margin-left:8px;color:var(--warning);letter-spacing:.05em">EXECUTION LOG</span>
+      <span id="term-pct" style="margin-left:8px;color:var(--text-muted)"></span>
+      <span style="margin-left:auto" id="term-caret"><i class="fa-solid fa-chevron-up"></i></span>
+    </div>
+    <div class="term-body" id="term-body">
+      <div class="l-dim"># Waiting for pipeline execution…</div>
     </div>
   </div>
 </div>
 {% endblock %}
 {% block scripts %}
 <script>
+// ── Data ──────────────────────────────────────────────────────────────────────
+const DAGS     = {{ dags | safe }};
+const DATASETS = {{ datasets | tojson }};
+// ── State ─────────────────────────────────────────────────────────────────────
+let cur       = 'training_pipeline';
+let execId    = null;
+let pollIv    = null;
+let selNode   = null;
+let tstates   = {};
+let _seenLogs = 0;
+// Pipeline context — updated via config panel; used when running
+let pCtx = {
+  dataset:   Object.keys(DATASETS)[0] || 'Iris Flowers',
+  category:  'Tree-Based',
+  algorithm: 'Random Forest',
+  task_type: 'classification',
 };
+// Layout
+const NW=130, NH=64, HGAP=68, VGAP=24, PX=44, PY=44;
+// Which nodes show config controls (purple dot)
+const CFG_TYPE = { load_data:'dataset', ingest:'dataset', train:'algorithm', retrain:'algorithm' };
+// Node positions (populated in renderDAG)
+let npos = {};
+// ── Init ──────────────────────────────────────────────────────────────────────
+document.addEventListener('DOMContentLoaded', () =>
+  switchPipeline('training_pipeline', document.querySelector('.ps-tab.active')));
+// ── Pipeline switch ───────────────────────────────────────────────────────────
+// Activate pipeline `id` (a key of DAGS) and mark tab button `btn` as active.
+// Stops any running status poll, clears per-execution state, closes the config
+// panel, redraws the DAG with no task states and resets badge/terminal/button.
 function switchPipeline(id, btn) {
   if (pollIv) { clearInterval(pollIv); pollIv = null; }
+  cur = id; execId = null; tstates = {}; selNode = null;
+  closeConfig(false);
+  document.querySelectorAll('.ps-tab').forEach(b => b.classList.remove('active'));
   btn.classList.add('active');
+  const d = DAGS[id];
+  document.getElementById('ps-name').textContent = d.name;
+  document.getElementById('ps-desc').textContent = d.description;
+  // Empty state map: every node renders as "pending".
+  renderDAG(d, {});
+  _setBadge('idle');
+  _resetTerm();
+  _resetBtn();
+}
+// ── DAG rendering ─────────────────────────────────────────────────────────────
+function renderDAG(dag, states) {
+  states = states || {};
+  const tasks = Object.values(dag.tasks);
+  const layers = {};
+  tasks.forEach(t => (layers[t.layer] = layers[t.layer] || []).push(t));
+  const maxL = Math.max(...tasks.map(t => t.layer));
+  const maxN = Math.max(...Object.values(layers).map(ts => ts.length));
+  // Compute positions (center-align multi-node layers)
+  npos = {};
+  Object.entries(layers).forEach(([li, ts]) => {
+    const x = PX + +li * (NW + HGAP);
+    const totalH = ts.length * NH + Math.max(0, ts.length-1) * VGAP;
+    const baseY  = PY + (maxN * (NH+VGAP) - totalH) / 2;
+    ts.forEach((t, i) => { npos[t.task_id] = { x, y: baseY + i*(NH+VGAP) }; });
   });
+  const cw = PX*2 + (maxL+1)*NW + maxL*HGAP;
+  const ch = PY*2 + maxN*NH + Math.max(0,maxN-1)*VGAP;
+  const ci = document.getElementById('ps-ci');
+  ci.style.width  = Math.max(cw,400)+'px';
+  ci.style.height = Math.max(ch,320)+'px';
+  // Remove old nodes
+  ci.querySelectorAll('.dag-node').forEach(e => e.remove());
+  // Create nodes
   tasks.forEach(t => {
+    const p   = npos[t.task_id];
+    const st  = (states[t.task_id]||{}).status || 'pending';
+    const res = (states[t.task_id]||{}).result  || '';
+    const sel = t.task_id === selNode;
+    const cfg = !!CFG_TYPE[t.task_id];
+    const el = document.createElement('div');
+    el.className = `dag-node s-${st}${sel?' selected':''}${cfg?' configurable':''}`;
+    el.id = 'node-'+t.task_id;
+    el.style.cssText = `left:${p.x}px;top:${p.y}px;width:${NW}px`;
+    el.innerHTML = `
+      <span class="nd-icon">${t.icon}</span>
+      <div class="nd-name">${t.name}</div>
+      <div class="nd-badge ${st}">
+        <span class="sdot ${st}"></span>${st}
+      </div>
+      ${res?`<div class="nd-result" title="${res}">${res}</div>`:''}
+    `;
+    el.addEventListener('click', () => openConfig(t.task_id));
+    ci.appendChild(el);
   });
+  // Arrows
+  _drawArrows(dag, states, Math.max(cw,400), Math.max(ch,320));
+}
+function _drawArrows(dag, states, w, h) {
+  const svg = document.getElementById('dag-svg');
+  svg.setAttribute('width', w);
+  svg.setAttribute('height', h);
+  svg.innerHTML = `
+    <defs>
+      <marker id="ah" markerWidth="8" markerHeight="6" refX="7" refY="3" orient="auto">
+        <polygon points="0 0,8 3,0 6" fill="var(--border-color)"/>
+      </marker>
+      <marker id="ah-ok" markerWidth="8" markerHeight="6" refX="7" refY="3" orient="auto">
+        <polygon points="0 0,8 3,0 6" fill="#22c55e66"/>
+      </marker>
+    </defs>`;
+  Object.values(dag.tasks).forEach(t => {
+    t.upstream.forEach(uid => {
+      const a = npos[uid], b = npos[t.task_id];
+      if (!a||!b) return;
+      const x1=a.x+NW, y1=a.y+NH/2, x2=b.x, y2=b.y+NH/2, cx=(x1+x2)/2;
+      const uSt=(states[uid]||{}).status||'pending';
+      const tSt=(states[t.task_id]||{}).status||'pending';
+      const ok = uSt==='success'&&tSt==='success';
+      const p  = document.createElementNS('http://www.w3.org/2000/svg','path');
+      p.setAttribute('d', `M${x1},${y1} C${cx},${y1} ${cx},${y2} ${x2},${y2}`);
+      p.setAttribute('stroke', ok?'#22c55e55':'var(--border-color)');
+      p.setAttribute('stroke-width','1.5');
+      p.setAttribute('fill','none');
+      p.setAttribute('marker-end',`url(#${ok?'ah-ok':'ah'})`);
+      svg.appendChild(p);
+    });
   });
+}
+// ── Config panel ──────────────────────────────────────────────────────────────
+async function openConfig(taskId) {
+  selNode = taskId;
+  const dag  = DAGS[cur];
+  const task = dag.tasks[taskId];
+  const st   = (tstates[taskId]||{}).status  || 'pending';
+  const res  = (tstates[taskId]||{}).result  || null;
+  const err  = (tstates[taskId]||{}).error   || null;
+  const cfgT = CFG_TYPE[taskId];
+  const stClr= {running:'var(--warning)',success:'var(--success)',failed:'var(--danger)'}[st]||'var(--text-muted)';
+  // Highlight node
+  document.querySelectorAll('.dag-node').forEach(e => e.classList.remove('selected'));
+  const ne = document.getElementById('node-'+taskId);
+  if (ne) ne.classList.add('selected');
+  let html = `
+    <div class="cfg-node-hdr">
+      <span class="cfg-node-icon">${task.icon}</span>
+      <div>
+        <div class="cfg-node-title">${task.name}</div>
+        <div class="cfg-node-desc">${task.description}</div>
+      </div>
+    </div>
+    <!-- Status (always visible, updated in-place) -->
+    <div class="cfg-sec">
+      <span class="cfg-lbl">Status</span>
+      <div class="cfg-row">
+        <span class="cfg-row-k">State</span>
+        <span class="cfg-row-v" id="cfg-st" style="color:${stClr}">${st.toUpperCase()}</span>
       </div>
+      <div class="cfg-row" id="cfg-res-row" style="${res?'':'display:none'}">
+        <span class="cfg-row-k">Result</span>
+        <span class="cfg-row-v" id="cfg-res">${res||''}</span>
+      </div>
+      <div class="cfg-row" id="cfg-err-row" style="${err?'':'display:none'}">
+        <span class="cfg-row-k">Error</span>
+        <span class="cfg-row-v" id="cfg-err" style="color:var(--danger)">${err||''}</span>
+      </div>
+    </div>
+  `;
+  // Inputs for configurable nodes
+  if (cfgT === 'dataset') {
+    html += `
+      <div class="cfg-sec">
+        <label class="cfg-lbl" for="cfg-ds">Dataset</label>
+        <select class="cfg-select" id="cfg-ds" onchange="pCtx.dataset=this.value">
+          ${Object.keys(DATASETS).map(n=>`<option${n===pCtx.dataset?' selected':''}>${n}</option>`).join('')}
+        </select>
+      </div>`;
+  } else if (cfgT === 'algorithm') {
+    html += `
+      <div class="cfg-sec">
+        <label class="cfg-lbl" for="cfg-tt">Task Type</label>
+        <select class="cfg-select" id="cfg-tt" onchange="onTtChange(this.value)">
+          <option value="classification"${pCtx.task_type==='classification'?' selected':''}>Classification</option>
+          <option value="regression"${pCtx.task_type==='regression'?' selected':''}>Regression</option>
+        </select>
+      </div>
+      <div class="cfg-sec">
+        <label class="cfg-lbl" for="cfg-cat">Category</label>
+        <select class="cfg-select" id="cfg-cat"><option>Loading…</option></select>
+      </div>
+      <div class="cfg-sec">
+        <label class="cfg-lbl" for="cfg-alg">Algorithm</label>
+        <select class="cfg-select" id="cfg-alg" onchange="pCtx.algorithm=this.value"><option>Loading…</option></select>
+      </div>`;
+  }
+  // Upstream deps
+  if (task.upstream && task.upstream.length) {
+    html += `<div class="cfg-sec"><span class="cfg-lbl">Upstream</span>`;
+    task.upstream.forEach(uid => {
+      const up   = dag.tasks[uid];
+      const upSt = (tstates[uid]||{}).status||'pending';
+      html += `<div class="cfg-row">
+        <span class="cfg-row-k">${up?up.icon+' '+up.name:uid}</span>
+        <span class="nd-badge ${upSt}" style="font-size:.65rem;padding:1px 6px">
+          <span class="sdot ${upSt}"></span>${upSt}
+        </span>
+      </div>`;
+    });
+    html += `</div>`;
+  }
+  document.getElementById('cfg-body').innerHTML = html;
+  document.getElementById('ps-cfg').classList.add('open');
+  if (cfgT === 'algorithm') await _loadAlgos(pCtx.task_type);
+}
+function closeConfig(redraw=true) {
+  document.getElementById('ps-cfg').classList.remove('open');
+  if (redraw) document.querySelectorAll('.dag-node').forEach(e => e.classList.remove('selected'));
+  selNode = null;
+}
+// Update only the status bits in the open config panel (called during polling)
+function _updateCfgStatus() {
+  if (!selNode) return;
+  const st  = (tstates[selNode]||{}).status  || 'pending';
+  const res = (tstates[selNode]||{}).result  || null;
+  const err = (tstates[selNode]||{}).error   || null;
+  const stClr={running:'var(--warning)',success:'var(--success)',failed:'var(--danger)'}[st]||'var(--text-muted)';
+  const stEl = document.getElementById('cfg-st');
+  if (stEl) { stEl.textContent = st.toUpperCase(); stEl.style.color = stClr; }
+  const rRow = document.getElementById('cfg-res-row');
+  const rEl  = document.getElementById('cfg-res');
+  if (rRow && rEl && res) { rRow.style.display=''; rEl.textContent=res; }
+  const eRow = document.getElementById('cfg-err-row');
+  const eEl  = document.getElementById('cfg-err');
+  if (eRow && eEl && err) { eRow.style.display=''; eEl.textContent=err; }
 }
+// ── Algorithm dropdowns ───────────────────────────────────────────────────────
+let _algoData = null;
+async function _loadAlgos(tt) {
+  try {
+    const r = await fetch(`/api/algorithms?task=${tt}`);
+    _algoData = await r.json();
+    const cats = Object.keys(_algoData);
+    const catSel = document.getElementById('cfg-cat');
+    if (!catSel) return;
+    catSel.innerHTML = cats.map(c=>`<option${c===pCtx.category?' selected':''}>${c}</option>`).join('');
+    const cat = cats.includes(pCtx.category)?pCtx.category:cats[0];
+    catSel.value = cat; pCtx.category = cat;
+    catSel.onchange = e => onCatChange(e.target.value);
+    _fillAlgos(cat);
+  } catch(e) {}
+}
+function _fillAlgos(cat) {
+  const algs = _algoData&&_algoData[cat]?Object.keys(_algoData[cat]):[];
+  const sel  = document.getElementById('cfg-alg');
+  if (!sel) return;
+  sel.innerHTML = algs.map(a=>`<option${a===pCtx.algorithm?' selected':''}>${a}</option>`).join('');
+  const alg = algs.includes(pCtx.algorithm)?pCtx.algorithm:algs[0]||'';
+  sel.value = alg; pCtx.algorithm = alg;
+  sel.onchange = e => { pCtx.algorithm = e.target.value; };
+}
+async function onTtChange(tt) {
+  pCtx.task_type = tt; pCtx.category=''; pCtx.algorithm='';
+  await _loadAlgos(tt);
+}
+function onCatChange(cat) { pCtx.category=cat; _fillAlgos(cat); }
 // ── Execute pipeline ──────────────────────────────────────────────────────────
 async function runPipeline() {
+  const runBtn = document.getElementById('ps-run-btn');
+  runBtn.disabled = true;
+  document.getElementById('ps-btn-icon').className = 'spinner';
+  document.getElementById('ps-btn-txt').textContent = 'Running…';
+  _setBadge('running');
+  _openTerm();
+  _addLog(`$ ${DAGS[cur].name}`, 'info');
   const ctx = {};
+  if (cur === 'training_pipeline') {
+    Object.assign(ctx, { dataset:pCtx.dataset, category:pCtx.category,
+                          algorithm:pCtx.algorithm, task_type:pCtx.task_type });
+    _addLog(`  dataset="${ctx.dataset}"  algorithm="${ctx.algorithm}"`, 'dim');
   }
   try {
+    const r = await fetch(`/api/pipeline/${cur}/execute`, {
+      method:'POST', headers:{'Content-Type':'application/json'},
       body: JSON.stringify(ctx),
     });
+    const d = await r.json();
+    if (d.error) { _execFailed(d.error); return; }
+    execId = d.exec_id;
+    _addLog(`  engine=${d.engine||'builtin'}  id=${d.exec_id}`, 'dim');
+    _poll();
+  } catch(e) { _execFailed(e.message); }
 }
+function _poll() {
+  _seenLogs = 0;
   if (pollIv) clearInterval(pollIv);
   pollIv = setInterval(async () => {
+    try {
+      const r    = await fetch(`/api/pipeline/status/${execId}`);
+      const exec = await r.json();
+      tstates = exec.task_states || {};
+      // Sync new log lines
+      const lines = exec.logs||[];
+      if (lines.length > _seenLogs) {
+        lines.slice(_seenLogs).forEach(ln => {
+          if (!ln) return;
+          let c='dim';
+          if (ln.includes('✔')) c='ok';
+          else if (ln.includes('✖')||ln.toLowerCase().includes('fail')) c='err';
+          else if (ln.includes('▶')) c='info';
+          _addLog(ln, c);
+        });
+        _seenLogs = lines.length;
+      }
+      document.getElementById('term-pct').textContent = exec.progress!=null?exec.progress+'%':'';
+      renderDAG(DAGS[cur], tstates);
+      _updateCfgStatus();
+      if (exec.status==='completed') {
+        clearInterval(pollIv); pollIv=null;
+        _setBadge('success');
+        _addLog('✔ Pipeline completed successfully', 'ok');
+        document.getElementById('ps-btn-icon').className = 'fa-solid fa-rotate-right';
+        document.getElementById('ps-btn-txt').textContent = 'Run Again';
+        document.getElementById('ps-run-btn').disabled = false;
+        showToast(`${DAGS[cur].name} completed`,'success');
+      } else if (exec.status==='failed') {
+        clearInterval(pollIv); pollIv=null;
+        _setBadge('failed');
+        _addLog('✖ '+(exec.error||'Pipeline failed'),'err');
+        _resetBtn();
+        showToast('Pipeline failed','error');
+      }
+    } catch(e) {}
+  }, 900);
+}
+function _execFailed(msg) { _addLog('✖ '+msg,'err'); _setBadge('failed'); _resetBtn(); }
+// ── Helpers ───────────────────────────────────────────────────────────────────
+function _setBadge(s) {
+  const labels={idle:'Idle',running:'Running',success:'Completed',failed:'Failed'};
+  document.getElementById('ps-badge').className = 'ps-badge '+s;
+  document.getElementById('ps-dot').className   = 'sdot '+(s==='idle'?'pending':s);
+  document.getElementById('ps-badge-txt').textContent = labels[s]||s;
+}
+function _resetBtn() {
+  btn().disabled = false;
+  document.getElementById('ps-btn-icon').className = 'fa-solid fa-play';
+  document.getElementById('ps-btn-txt').textContent = 'Execute DAG';
+}
+function _addLog(txt, cls) {
+  const b  = document.getElementById('term-body');
+  const el = document.createElement('div');
+  el.className = 'l-'+(cls||'dim'); el.textContent = txt;
+  b.appendChild(el); b.scrollTop = b.scrollHeight;
+}
+function _openTerm() {
+  document.getElementById('term-body').innerHTML = '';
+  document.getElementById('ps-term').classList.add('expanded');
+  document.getElementById('term-caret').innerHTML = '<i class="fa-solid fa-chevron-down"></i>';
+}
+function toggleTerm() {
+  const el = document.getElementById('ps-term');
+  const ex = el.classList.contains('expanded');
+  el.classList.toggle('expanded',!ex);
+  document.getElementById('term-caret').innerHTML =
+    `<i class="fa-solid fa-chevron-${ex?'up':'down'}"></i>`;
+}
+function _resetTerm() {
+  document.getElementById('term-body').innerHTML = '<div class="l-dim"># Waiting for pipeline execution…</div>';
+  document.getElementById('term-pct').textContent='';
+  document.getElementById('ps-term').classList.remove('expanded');
+  document.getElementById('term-caret').innerHTML='<i class="fa-solid fa-chevron-up"></i>';
+}
 </script>
 {% endblock %}