ocr_paligemma / Dockerfile
rockerritesh's picture
Update Dockerfile
3394521 verified
# Use an official Python runtime as a parent image
FROM python:3.9-slim
# Set the working directory
WORKDIR /app
# Install necessary system dependencies
RUN apt-get update && apt-get install -y gcc && rm -rf /var/lib/apt/lists/*
# Install system dependencies
RUN apt-get update && apt-get install -y \
poppler-utils \
build-essential \
python3-dev \
python3-distutils \
cmake \
libglib2.0-0 \
libsm6 \
libxext6 \
libxrender-dev \
libgl1-mesa-glx \
ffmpeg \
&& apt-get clean \
&& rm -rf /var/lib/apt/lists/*
# Set the CC environment variable to ensure TorchInductor uses the correct compiler
ENV CC=gcc
# Copy the requirements file and install dependencies
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt
# Create cache and config directories with appropriate permissions
RUN mkdir -p /app/cache && chmod 777 /app/cache
RUN mkdir -p /app/config && chmod 777 /app/config
RUN mkdir -p /app/triton_cache && chmod 777 /app/triton_cache
RUN mkdir -p /app/torchinductor_cache && chmod 777 /app/torchinductor_cache
RUN mkdir -p /mnt/data && chmod 777 /mnt/data
# Create directories for Matplotlib and Fontconfig with appropriate permissions
RUN mkdir -p /app/matplotlib && chmod 777 /app/matplotlib
RUN mkdir -p /app/fontconfig && chmod 777 /app/fontconfig
# Set environment variables for Hugging Face cache, config, Triton, and TorchInductor directories
ENV HF_HOME=/app/cache
ENV XDG_CONFIG_HOME=/app/config
ENV TRITON_CACHE_DIR=/app/triton_cache
ENV TORCHINDUCTOR_CACHE_DIR=/app/torchinductor_cache
ENV MPLCONFIGDIR=/app/matplotlib
ENV FONTCONFIG_PATH=/app/fontconfig
ENV XDG_CACHE_HOME=/app/cache
# Copy the application code
COPY main.py .
COPY utils.py utils_ocr.py .
COPY ocr /app/ocr
# Expose the port FastAPI will run on
EXPOSE 7860
# Command to run the FastAPI app
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860", "--workers","4"]