LLM / Dockerfile
dpv007's picture
Update Dockerfile
4756ce1 verified
Raw
History Blame Contribute Delete
938 Bytes
# Use a lightweight Python 3.10 base image
FROM python:3.10-slim
# 1. Hugging Face strictly requires running as a non-root user (UID 1000)
RUN useradd -m -u 1000 user
USER user
# 2. Set up environment variables for the user
ENV HOME=/home/user \
PATH=/home/user/.local/bin:$PATH
# 3. Set the working directory
WORKDIR $HOME/app
# 4. Copy requirements first to leverage Docker layer caching
COPY --chown=user requirements.txt $HOME/app/
# 5. Install dependencies, using the pre-built CPU wheel to bypass compilation
RUN pip install --no-cache-dir --upgrade pip && \
pip install --no-cache-dir -r requirements.txt \
--extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu
# 6. Copy the main application code
COPY --chown=user app.py $HOME/app/
# 7. Expose port 7860 (The standard port for HF Spaces)
EXPOSE 7860
# 8. Start the Uvicorn server
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]