Upload ms-swift/examples/infer/vllm/mllm_tp.sh with huggingface_hub
Browse files
ms-swift/examples/infer/vllm/mllm_tp.sh
ADDED
@@ -0,0 +1,11 @@
# Run multimodal inference through the vLLM backend with tensor parallelism.
#
# The whole script is ONE command: two environment assignments followed by
# `swift infer` and its flags, joined by trailing backslashes. Nothing may be
# inserted between the continued lines, or the command falls apart.
#
# - CUDA_VISIBLE_DEVICES lists two device indices, matching
#   --tensor_parallel_size 2.
# - MAX_PIXELS is handed to the process via the environment
#   (1003520 = 1280 * 28 * 28). NOTE(review): presumably an upper bound on
#   per-image pixels applied by the model's image preprocessing -- confirm
#   against the ms-swift documentation.
# - The `#1000` suffix on the dataset id is part of the argument word, not a
#   shell comment. NOTE(review): presumably selects 1000 samples -- confirm.
# - --limit_mm_per_prompt takes a JSON object; it is single-quoted so the
#   shell passes the braces, double quotes and spaces through verbatim.
CUDA_VISIBLE_DEVICES=0,1 \
MAX_PIXELS=1003520 \
swift infer \
    --model Qwen/Qwen2.5-VL-3B-Instruct \
    --infer_backend vllm \
    --val_dataset AI-ModelScope/LaTeX_OCR#1000 \
    --gpu_memory_utilization 0.9 \
    --tensor_parallel_size 2 \
    --max_model_len 32768 \
    --max_new_tokens 2048 \
    --limit_mm_per_prompt '{"image": 5, "video": 2}'