# syntax=docker/dockerfile:1

# Image that layers a small application and a pre-downloaded Hugging Face
# model on top of the vLLM OpenAI-compatible server image.
#
# Build (public model):
#   docker build -t <image> .
# Build (gated/private model) -- pass the token as a BuildKit secret so it is
# never written to an image layer, the image config, or the build history:
#   docker build --secret id=hf_token,env=HF_TOKEN -t <image> .

# Base image tag. Defaults to `latest` to preserve existing behaviour; pin a
# specific release (or digest) with `--build-arg VLLM_IMAGE_TAG=<tag>` for
# reproducible builds.
ARG VLLM_IMAGE_TAG=latest
FROM vllm/vllm-openai:${VLLM_IMAGE_TAG}

WORKDIR /app

# Install Python dependencies before copying application code so this layer
# stays cached until requirements.txt changes.
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# Hugging Face repository to bake into the image (override with --build-arg).
ARG MODEL_REPO=Qwen/Qwen1.5-4B-Chat-AWQ

# Runtime configuration:
#   MODEL_DIR                  local directory the model is downloaded into
#   SERVED_MODEL_NAME          set to the repository id chosen at build time
#   HF_HUB_ENABLE_HF_TRANSFER  opts in to the hf_transfer download backend
#                              (presumably installed via requirements.txt --
#                              TODO confirm)
ENV MODEL_DIR=/app/models/model \
    SERVED_MODEL_NAME=${MODEL_REPO} \
    HF_HUB_ENABLE_HF_TRANSFER=1

# Deprecated fallback: `--build-arg HF_TOKEN=...` is still honoured so existing
# build commands keep working, but build-arg values are recorded in the build
# history. Prefer the `hf_token` secret shown at the top of this file.
ARG HF_TOKEN

# Download the model at build time.
# The token (if any) is exported as HF_TOKEN for this step only; it is not
# persisted via ENV and no `login` is performed, so nothing is written to the
# image. A secret, when supplied, takes precedence over the build arg.
# NOTE(review): the token is no longer available inside the running container;
# if entrypoint.sh or app.py needs it, pass it at `docker run` time.
RUN --mount=type=secret,id=hf_token \
    set -eu; \
    if [ -s /run/secrets/hf_token ]; then \
        HF_TOKEN="$(cat /run/secrets/hf_token)"; \
        export HF_TOKEN; \
    fi; \
    mkdir -p "${MODEL_DIR}"; \
    hf download "${MODEL_REPO}" --local-dir "${MODEL_DIR}"; \
    ls -lh "${MODEL_DIR}"

# Application code is copied last because it changes most often.
COPY app.py .
# Set the executable bit at copy time instead of a separate chmod layer.
COPY --chmod=755 entrypoint.sh .

# Documentation only; publish with `docker run -p`.
# Presumably 8000 is the vLLM API and 7860 the app UI -- TODO confirm against
# entrypoint.sh / app.py.
EXPOSE 8000 7860

# NOTE(review): no USER is set here, so the container runs as whatever user the
# base image defaults to, and there is no HEALTHCHECK. Consider adding both
# once entrypoint.sh's filesystem and port requirements are confirmed.
ENTRYPOINT ["/app/entrypoint.sh"]