medical-coding-api / Dockerfile
Distopia22's picture
Production-ready Medical Coding API with Phi-3 support
d03f587
raw
history blame
1.57 kB
FROM python:3.10-slim
# Set working directory
WORKDIR /app
# Set environment variables
ENV PYTHONUNBUFFERED=1 \
PYTHONDONTWRITEBYTECODE=1 \
PIP_NO_CACHE_DIR=1 \
PIP_DISABLE_PIP_VERSION_CHECK=1 \
TRANSFORMERS_CACHE=/app/.cache/transformers \
HF_HOME=/app/.cache/huggingface \
DEBIAN_FRONTEND=noninteractive
# Install system dependencies
RUN apt-get update && apt-get install -y --no-install-recommends \
git \
git-lfs \
build-essential \
curl \
ca-certificates \
&& git lfs install \
&& rm -rf /var/lib/apt/lists/* \
&& apt-get clean
# Upgrade pip and install build tools
RUN pip install --no-cache-dir --upgrade \
pip==24.0 \
setuptools==69.5.1 \
wheel==0.43.0
# Copy requirements first for better Docker caching
COPY requirements.txt .
# Install Python dependencies
RUN pip install --no-cache-dir -r requirements.txt
# Copy application code
COPY app/ ./app/
# Create necessary directories with proper permissions
RUN mkdir -p /app/offload /app/.cache/transformers /app/.cache/huggingface && \
chmod -R 777 /app/offload /app/.cache
# Expose port 7860 (HuggingFace Spaces standard)
EXPOSE 7860
# Health check - more lenient for model loading
HEALTHCHECK --interval=30s --timeout=20s --start-period=300s --retries=5 \
CMD curl -f http://localhost:7860/health || exit 1
# Run the application with increased timeouts
CMD ["uvicorn", "app.api:app", \
"--host", "0.0.0.0", \
"--port", "7860", \
"--timeout-keep-alive", "300", \
"--workers", "1", \
"--log-level", "info"]