AIencoder committed on
Commit
b57cd88
·
verified ·
1 Parent(s): 9abf1d5

Update start.sh

Browse files
Files changed (1) hide show
  1. start.sh +5 -7
start.sh CHANGED
@@ -36,22 +36,20 @@ except Exception as e:
36
  # 1. TEXT: Qwen 2.5 Coder
37
  download_model "Qwen/Qwen2.5-Coder-14B-Instruct-GGUF" "qwen2.5-coder-14b-instruct-q4_k_m.gguf"
38
 
39
- # 2. IMAGE: Qwen 2.5 VL (FIXED: correct case-sensitive filename)
40
  download_model "ggml-org/Qwen2.5-VL-7B-Instruct-GGUF" "Qwen2.5-VL-7B-Instruct-Q4_K_M.gguf" "qwen2.5-vl-7b-instruct-q4_k_m.gguf"
41
 
42
  # 3. AUDIO: Qwen 2 Audio
43
  download_model "gaianet/Qwen2-Audio-7B-Instruct-GGUF" "Qwen2-Audio-7B-Instruct-Q4_K_M.gguf" "qwen2-audio-7b-instruct-q4_k_m.gguf"
44
 
45
  echo "------------------------------------------------"
46
- echo "🚀 Starting Server"
47
  echo "------------------------------------------------"
48
 
49
- MODEL_FILE="/app/models/qwen2.5-coder-14b-instruct-q4_k_m.gguf"
50
-
51
- echo "Selected Model: $MODEL_FILE"
52
-
53
  exec /usr/local/bin/llama-server \
54
- -m "$MODEL_FILE" \
 
55
  --host 0.0.0.0 \
56
  --port 7860 \
57
  -c 8192 \
 
36
  # 1. TEXT: Qwen 2.5 Coder
37
  download_model "Qwen/Qwen2.5-Coder-14B-Instruct-GGUF" "qwen2.5-coder-14b-instruct-q4_k_m.gguf"
38
 
39
+ # 2. IMAGE: Qwen 2.5 VL (correct case-sensitive filename)
40
  download_model "ggml-org/Qwen2.5-VL-7B-Instruct-GGUF" "Qwen2.5-VL-7B-Instruct-Q4_K_M.gguf" "qwen2.5-vl-7b-instruct-q4_k_m.gguf"
41
 
42
  # 3. AUDIO: Qwen 2 Audio
43
  download_model "gaianet/Qwen2-Audio-7B-Instruct-GGUF" "Qwen2-Audio-7B-Instruct-Q4_K_M.gguf" "qwen2-audio-7b-instruct-q4_k_m.gguf"
44
 
45
  echo "------------------------------------------------"
46
+ echo "🚀 Starting Server in Router Mode"
47
  echo "------------------------------------------------"
48
 
49
+ # Start in ROUTER MODE - serve all models from /app/models
 
 
 
50
  exec /usr/local/bin/llama-server \
51
+ --models-dir /app/models \
52
+ --models-max 3 \
53
  --host 0.0.0.0 \
54
  --port 7860 \
55
  -c 8192 \