dengcao
/

Qwen3-Reranker-8B

Model card | Files and versions

dengcao committed on Jul 7, 2025

Commit

f68da82

·

verified ·

1 Parent(s): a422b39

Update docker-compose.yaml

Files changed (1) hide show

docker-compose.yaml +19 -18

docker-compose.yaml CHANGED Viewed

@@ -1,18 +1,19 @@
-services:
-  Qwen3-Reranker-8B:
-    container_name: Qwen3-Reranker-8B
-    restart: no
-    image: dengcao/vllm-openai:v0.9.2-dev #采用vllm最新的开发版制作的镜像，经在NVIDIA RTX3060平台主机上测试正常，可放心使用。
-    ipc: host
-    volumes:
-      - ./models:/models
-    command: ['--model', '/models/Qwen3-Reranker-8B',  '--served-model-name', 'Qwen3-Reranker-8B',  '--gpu-memory-utilization', '0.90', '--hf_overrides','{"architectures": ["Qwen3ForSequenceClassification"],"classifier_from_token": ["no", "yes"],"is_original_qwen3_reranker": true}']
-    ports:
-      - 8012:8000
-    deploy:
-      resources:
-        reservations:
-          devices:
-            - driver: nvidia
-              count: all
-              capabilities: [gpu]

+services:
+  Qwen3-Reranker-8B:
+    container_name: Qwen3-Reranker-8B
+    restart: no
+    #image: dengcao/vllm-openai:v0.9.2-dev #采用vllm最新的开发版制作的镜像，经在NVIDIA RTX3060平台主机上测试正常，可放心使用。
+    image: dengcao/vllm-openai:v0.9.2rc2
+    ipc: host
+    volumes:
+      - ./models:/models
+    command: ['--model', '/models/Qwen3-Reranker-8B',  '--served-model-name', 'Qwen3-Reranker-8B',  '--gpu-memory-utilization', '0.90', '--hf_overrides','{"architectures": ["Qwen3ForSequenceClassification"],"classifier_from_token": ["no", "yes"],"is_original_qwen3_reranker": true}']
+    ports:
+      - 8012:8000
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: all
+              capabilities: [gpu]