open-finance-llm-8b / Dockerfile.koyeb
jeanbaptdzd's picture
Cleanup: remove redundant docs, condense README
7a92d8e
raw
history blame contribute delete
627 Bytes
# Koyeb-optimized Dockerfile using official vLLM OpenAI image
# Compatible with Koyeb's one-click deployment patterns for Qwen + vLLM
# Uses ENTRYPOINT to ensure args aren't overridden by Koyeb
FROM vllm/vllm-openai:latest
# Environment variables
ENV HF_HOME=/tmp/huggingface \
VLLM_ATTENTION_BACKEND=FLASH_ATTN
# Create cache directories
RUN mkdir -p /tmp/huggingface && chmod 777 /tmp/huggingface
# Copy startup script
COPY start-vllm.sh /start-vllm.sh
RUN chmod +x /start-vllm.sh
# Expose vLLM default port
EXPOSE 8000
# Use ENTRYPOINT so it can't be overridden by empty Koyeb args
ENTRYPOINT ["/start-vllm.sh"]