FROM python:3.10.9 # Set the working directory to /app WORKDIR /app # Create a directory for storing downloaded PDF files RUN mkdir /app/downloads # Create a non-root user RUN useradd -m appuser # Copy the current directory contents into the container at /app COPY . /app # Install system dependencies RUN apt-get update && apt-get install -y \ libgl1-mesa-glx \ libglib2.0-0 \ poppler-utils \ tesseract-ocr # Install Python dependencies RUN pip install --no-cache-dir --upgrade -r /app/requirements.txt # Change ownership of the app directory to the non-root user RUN chown -R appuser:appuser /app # Switch to the non-root user USER appuser # Set the nltk_data directory path ENV NLTK_DATA /app/nltk_data CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]