dengcao
/

Qwen3-Embedding-4B

Feature Extraction

sentence-transformers

sentence-similarity

text-embeddings-inference

Model card Files Files and versions

Qwen3-Embedding-4B / docker-compose.yaml

dengcao's picture

Update docker-compose.yaml

0df841e verified 10 months ago

history blame contribute delete

668 Bytes

	services:
	Qwen3-Embedding-4B:
	container_name: Qwen3-Embedding-4B
	restart: no
	#image: dengcao/vllm-openai:v0.9.2-dev #采用vllm最新的开发版制作的镜像，经测试正常，可放心使用
	#image: dengcao/vllm-openai:v0.9.2rc2
	image: dengcao/vllm-openai:v0.9.2
	ipc: host
	volumes:
	- ./models:/models
	command: ["--model", "/models/Qwen3-Embedding-4B", "--served-model-name", "Qwen3-Embedding-4B", "--gpu-memory-utilization", "0.90"]
	ports:
	- 8008:8000
	deploy:
	resources:
	reservations:
	devices:
	- driver: nvidia
	count: all
	capabilities: [gpu]