dengcao
/

Qwen3-Reranker-8B

Model card Files Files and versions

Qwen3-Reranker-8B / docker-compose.yaml

dengcao's picture

Update docker-compose.yaml

4498658 verified 7 months ago

history blame contribute delete

849 Bytes

	services:
	Qwen3-Reranker-8B:
	container_name: Qwen3-Reranker-8B
	restart: no
	#image: dengcao/vllm-openai:v0.9.2-dev #采用vllm最新的开发版制作的镜像，经在NVIDIA RTX3060平台主机上测试正常，可放心使用。
	#image: dengcao/vllm-openai:v0.9.2rc2
	image: dengcao/vllm-openai:v0.9.2
	ipc: host
	volumes:
	- ./models:/models
	command: ['--model', '/models/Qwen3-Reranker-8B', '--served-model-name', 'Qwen3-Reranker-8B', '--gpu-memory-utilization', '0.90', '--hf_overrides','{"architectures": ["Qwen3ForSequenceClassification"],"classifier_from_token": ["no", "yes"],"is_original_qwen3_reranker": true}']
	ports:
	- 8012:8000
	deploy:
	resources:
	reservations:
	devices:
	- driver: nvidia
	count: all
	capabilities: [gpu]