Sumkh committed on
Commit
3cbd702
·
verified ·
1 Parent(s): e489746

Update start.sh

Browse files
Files changed (1) hide show
  1. start.sh +3 -3
start.sh CHANGED
@@ -8,12 +8,12 @@ mkdir -p /app/.cache
8
  export USER_AGENT="vllm_huggingface_space"
9
 
10
  # Launch the vLLM server with the model tag as a positional argument
11
- vllm serve unsloth/llama-3-8b-Instruct-bnb-4bit \
12
  --enable-auto-tool-choice \
13
  --tool-call-parser llama3_json \
14
  --chat-template examples/tool_chat_template_llama3.1_json.jinja \
15
- --quantization bitsandbytes \
16
- --load-format bitsandbytes \
17
  --dtype half \
18
  --enforce-eager \
19
  --max-model-len 8192 &
 
8
  export USER_AGENT="vllm_huggingface_space"
9
 
10
  # Launch the vLLM server with the model tag as a positional argument
11
+ vllm serve MaziyarPanahi/Meta-Llama-3-70B-Instruct-GGUF \
12
  --enable-auto-tool-choice \
13
  --tool-call-parser llama3_json \
14
  --chat-template examples/tool_chat_template_llama3.1_json.jinja \
15
+ --quantization gguf \
16
+ --load-format gguf \
17
  --dtype half \
18
  --enforce-eager \
19
  --max-model-len 8192 &