FROM python:3.10-slim # Set working directory WORKDIR /app # Set environment variables ENV PYTHONUNBUFFERED=1 \ PYTHONDONTWRITEBYTECODE=1 \ PIP_NO_CACHE_DIR=1 \ PIP_DISABLE_PIP_VERSION_CHECK=1 \ TRANSFORMERS_CACHE=/app/.cache/transformers \ HF_HOME=/app/.cache/huggingface \ DEBIAN_FRONTEND=noninteractive # Install system dependencies RUN apt-get update && apt-get install -y --no-install-recommends \ git \ git-lfs \ build-essential \ curl \ ca-certificates \ && git lfs install \ && rm -rf /var/lib/apt/lists/* \ && apt-get clean # Upgrade pip and install build tools RUN pip install --no-cache-dir --upgrade \ pip==24.0 \ setuptools==69.5.1 \ wheel==0.43.0 # Copy requirements first for better Docker caching COPY requirements.txt . # Install Python dependencies RUN pip install --no-cache-dir -r requirements.txt # Copy application code COPY app/ ./app/ # Create necessary directories with proper permissions RUN mkdir -p /app/offload /app/.cache/transformers /app/.cache/huggingface && \ chmod -R 777 /app/offload /app/.cache # Expose port 7860 (HuggingFace Spaces standard) EXPOSE 7860 # Health check - more lenient for model loading HEALTHCHECK --interval=30s --timeout=20s --start-period=300s --retries=5 \ CMD curl -f http://localhost:7860/health || exit 1 # Run the application with increased timeouts CMD ["uvicorn", "app.api:app", \ "--host", "0.0.0.0", \ "--port", "7860", \ "--timeout-keep-alive", "300", \ "--workers", "1", \ "--log-level", "info"]