Sumkh committed on
Commit
32c3e70
·
verified ·
1 Parent(s): f625bfd

Update start.sh

Browse files
Files changed (1) hide show
  1. start.sh +1 -0
start.sh CHANGED
@@ -15,6 +15,7 @@ vllm serve unsloth/llama-3-8b-Instruct-bnb-4bit \
15
  --quantization bitsandbytes \
16
  --load-format bitsandbytes \
17
  --dtype half \
 
18
  --max-model-len 8192 &
19
 
20
  # Wait to ensure the vLLM server is fully started (adjust if needed)
 
15
  --quantization bitsandbytes \
16
  --load-format bitsandbytes \
17
  --dtype half \
18
+ --enforce-eager \
19
  --max-model-len 8192 &
20
 
21
  # Wait to ensure the vLLM server is fully started (adjust if needed)