File size: 2,119 Bytes
09cd93c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
bdf714a
 
 
 
 
 
09cd93c
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
# ===============================
# Stage 1: Build Frontend
# ===============================
# Cache bust: 2025-12-28 fix
FROM node:20-alpine AS frontend-builder

WORKDIR /frontend

COPY FRRONTEEEND/package*.json ./
RUN npm install

COPY FRRONTEEEND/ ./
RUN npm run build


# ===============================
# Stage 2: Build Python environment
# ===============================
FROM python:3.12-slim AS builder

# Install build dependencies (needed for ML wheels)
RUN apt-get update && apt-get install -y --no-install-recommends \
    gcc \
    g++ \
    make \
    && rm -rf /var/lib/apt/lists/*

# Create virtual environment
RUN python -m venv /opt/venv
ENV PATH="/opt/venv/bin:$PATH"

# Upgrade pip tooling
RUN pip install --upgrade pip setuptools wheel

# Install Python dependencies
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt


# ===============================
# Stage 3: Runtime environment
# ===============================
FROM python:3.12-slim

# Install runtime shared libraries
RUN apt-get update && apt-get install -y --no-install-recommends \
    libgomp1 \
    libstdc++6 \
    && rm -rf /var/lib/apt/lists/*

# Copy virtual environment
COPY --from=builder /opt/venv /opt/venv
ENV PATH="/opt/venv/bin:$PATH"

# App working directory
WORKDIR /app

# Copy backend code
COPY src/ /app/src/
COPY examples/ /app/examples/

# Copy frontend build
COPY --from=frontend-builder /frontend/dist /app/FRRONTEEEND/dist

# Cloud Run ephemeral directories
RUN mkdir -p \
    /tmp/data_science_agent \
    /tmp/outputs/models \
    /tmp/outputs/plots \
    /tmp/outputs/reports \
    /tmp/outputs/data \
    /tmp/cache_db

# Environment variables
ENV PYTHONUNBUFFERED=1
ENV PORT=8080
ENV OUTPUT_DIR=/tmp/outputs
ENV CACHE_DB_PATH=/tmp/cache_db/cache.db
ENV ARTIFACT_BACKEND=local

# YData Profiling optimization for 512MB RAM (Render Free Tier)
# Lower thresholds = aggressive sampling to prevent crashes
ENV YDATA_MAX_ROWS=50000
ENV YDATA_MAX_SIZE_MB=10
ENV YDATA_SAMPLE_SIZE=50000

EXPOSE 8080

# Start FastAPI
CMD ["uvicorn", "src.api.app:app", "--host", "0.0.0.0", "--port", "8080"]