# GPU-enabled Dockerfile for DGX Spark deployment (ARM64/aarch64 + CUDA 13.0) FROM nvidia/cuda:12.4.0-runtime-ubuntu22.04 # Install Python and system dependencies RUN apt-get update && apt-get install -y \ python3 \ python3-pip \ python3-dev \ curl \ build-essential \ && rm -rf /var/lib/apt/lists/* \ && ln -s /usr/bin/python3 /usr/bin/python WORKDIR /app # Install PyTorch with CUDA support first (before other requirements) # Using CUDA 12.4 wheels which are compatible with CUDA 13.0 driver RUN pip3 install --no-cache-dir \ torch \ --index-url https://download.pytorch.org/whl/cu124 # Copy requirements and install (excluding packages with ARM64 issues) COPY requirements.txt . RUN grep -v "^torch==" requirements.txt | \ grep -v "^zarr==" | \ grep -v "^numcodecs==" > requirements-spark.txt && \ pip3 install --no-cache-dir -r requirements-spark.txt # Copy backend code COPY backend/ ./backend/ COPY app.py . # Create runs directory RUN mkdir -p /app/runs # Health check (uses configurable port via environment) HEALTHCHECK --interval=30s --timeout=3s --start-period=60s --retries=3 \ CMD curl -f http://localhost:${PORT:-8000}/health || exit 1 # Expose configurable port EXPOSE ${PORT:-8000} # Default command (overridden by compose.spark.yml) CMD ["uvicorn", "backend.model_service:app", "--host", "0.0.0.0", "--port", "8000"]