alignmentforever committed on
Commit
d3327e3
·
verified ·
1 Parent(s): acb8cff

Upload deploy_medguide.sh with huggingface_hub

Browse files
Files changed (1) hide show
  1. deploy_medguide.sh +13 -0
deploy_medguide.sh ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# deploy_medguide.sh
#
# Starts a vLLM OpenAI-compatible server for the checkpoint at MODEL_PATH,
# published under the model name "medguide" on 0.0.0.0:8231.
#
# Usage: bash deploy_medguide.sh

# Expose eight GPUs (indices 0-7); this matches --tensor-parallel-size 8 below.
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7

# NOTE(review): presumably needed so vLLM accepts the --max-model-len value
# given below even if it exceeds the length derived from the model config;
# confirm against the vLLM environment-variable documentation.
export VLLM_ALLOW_LONG_MAX_MODEL_LEN=1

# NOTE(review): looks like this opts out of the vLLM V1 engine; confirm it is
# still honoured by the installed vLLM version.
export VLLM_USE_V1=0

# Checkpoint to serve.
MODEL_PATH='/aifs4su/hansirui_1st/boyuan/medguide_70b_1/slice_3'

# NOTE(review): the API key is hard-coded and is passed on the command line,
# so it is visible in this file and in the process argument list. Consider
# supplying it from the environment or a secrets file instead.
#
# "$MODEL_PATH" is quoted so the path is always passed as a single argument,
# with no word-splitting or glob expansion.
vllm serve "$MODEL_PATH" \
  --served-model-name medguide \
  --port 8231 \
  --host 0.0.0.0 \
  --dtype bfloat16 \
  --max-model-len 12000 \
  --gpu-memory-utilization 0.9 \
  --tensor-parallel-size 8 \
  --api-key medguide