yuccaaa committed on
Commit
95db7d3
·
verified ·
1 Parent(s): c8d85de

Upload ms-swift/examples/infer/vllm/mllm_tp.sh with huggingface_hub

Browse files
ms-swift/examples/infer/vllm/mllm_tp.sh ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
# Multimodal inference through the vLLM backend, sharded across two GPUs.
#
# CUDA_VISIBLE_DEVICES exposes GPUs 0 and 1, matching --tensor_parallel_size 2.
# MAX_PIXELS is handed to swift through the environment
# (presumably a per-image pixel cap -- TODO confirm against the ms-swift docs).
# NOTE(review): the "#1000" suffix on the dataset id presumably limits the run
# to 1000 samples -- confirm.
CUDA_VISIBLE_DEVICES=0,1 \
MAX_PIXELS=1003520 \
swift infer \
    --model Qwen/Qwen2.5-VL-3B-Instruct \
    --infer_backend vllm \
    --val_dataset AI-ModelScope/LaTeX_OCR#1000 \
    --gpu_memory_utilization 0.9 \
    --tensor_parallel_size 2 \
    --max_model_len 32768 \
    --max_new_tokens 2048 \
    --limit_mm_per_prompt '{"image": 5, "video": 2}'