Qwen3-Embedding-4B / docker-compose.yaml
dengcao's picture
Update docker-compose.yaml
0df841e verified
services:
Qwen3-Embedding-4B:
container_name: Qwen3-Embedding-4B
restart: no
#image: dengcao/vllm-openai:v0.9.2-dev #采用vllm最新的开发版制作的镜像,经测试正常,可放心使用
#image: dengcao/vllm-openai:v0.9.2rc2
image: dengcao/vllm-openai:v0.9.2
ipc: host
volumes:
- ./models:/models
command: ["--model", "/models/Qwen3-Embedding-4B", "--served-model-name", "Qwen3-Embedding-4B", "--gpu-memory-utilization", "0.90"]
ports:
- 8008:8000
deploy:
resources:
reservations:
devices:
- driver: nvidia
count: all
capabilities: [gpu]