moevis committed on
Commit
9187b40
·
verified ·
1 Parent(s): dd84d1d

Update start_services.sh

Browse files
Files changed (1) hide show
  1. start_services.sh +2 -2
start_services.sh CHANGED
@@ -40,9 +40,9 @@ python3 -m vllm.entrypoints.openai.api_server \
40
  --model "$MODEL_DIR" \
41
  --port "$API_PORT" \
42
  --host 0.0.0.0 \
43
- --max-model-len 8192 \
44
  --tensor-parallel-size 4 \
45
- --gpu-memory-utilization 0.97 \
46
  --trust-remote-code \
47
  --interleave-mm-strings \
48
  --served-model-name Step-Audio-R1 \
 
40
  --model "$MODEL_DIR" \
41
  --port "$API_PORT" \
42
  --host 0.0.0.0 \
43
+ --max-model-len 7192 \
44
  --tensor-parallel-size 4 \
45
+ --gpu-memory-utilization 0.92 \
46
  --trust-remote-code \
47
  --interleave-mm-strings \
48
  --served-model-name Step-Audio-R1 \