Sumkh committed on
Commit
19ad6b0
·
verified ·
1 Parent(s): 5c87648

Update start.sh

Browse files
Files changed (1) hide show
  1. start.sh +1 -0
start.sh CHANGED
@@ -14,6 +14,7 @@ vllm serve unsloth/llama-3-70b-Instruct-bnb-4bit \
14
  --chat-template examples/tool_chat_template_llama3.1_json.jinja \
15
  --quantization bitsandbytes \
16
  --load-format bitsandbytes \
 
17
  --enforce-eager &
18
 
19
  # Wait to ensure the vLLM server is fully started (adjust if needed)
 
14
  --chat-template examples/tool_chat_template_llama3.1_json.jinja \
15
  --quantization bitsandbytes \
16
  --load-format bitsandbytes \
17
+ --gpu_memory_utilization 0.9 \
18
  --enforce-eager &
19
 
20
  # Wait to ensure the vLLM server is fully started (adjust if needed)