Spaces:
Sleeping
Sleeping
Update start.sh
Browse files
start.sh
CHANGED
|
@@ -36,22 +36,20 @@ except Exception as e:
|
|
| 36 |
# 1. TEXT: Qwen 2.5 Coder
|
| 37 |
download_model "Qwen/Qwen2.5-Coder-14B-Instruct-GGUF" "qwen2.5-coder-14b-instruct-q4_k_m.gguf"
|
| 38 |
|
| 39 |
-
# 2. IMAGE: Qwen 2.5 VL (
|
| 40 |
download_model "ggml-org/Qwen2.5-VL-7B-Instruct-GGUF" "Qwen2.5-VL-7B-Instruct-Q4_K_M.gguf" "qwen2.5-vl-7b-instruct-q4_k_m.gguf"
|
| 41 |
|
| 42 |
# 3. AUDIO: Qwen 2 Audio
|
| 43 |
download_model "gaianet/Qwen2-Audio-7B-Instruct-GGUF" "Qwen2-Audio-7B-Instruct-Q4_K_M.gguf" "qwen2-audio-7b-instruct-q4_k_m.gguf"
|
| 44 |
|
| 45 |
echo "------------------------------------------------"
|
| 46 |
-
echo "🚀 Starting Server"
|
| 47 |
echo "------------------------------------------------"
|
| 48 |
|
| 49 |
-
|
| 50 |
-
|
| 51 |
-
echo "Selected Model: $MODEL_FILE"
|
| 52 |
-
|
| 53 |
exec /usr/local/bin/llama-server \
|
| 54 |
-
-
|
|
|
|
| 55 |
--host 0.0.0.0 \
|
| 56 |
--port 7860 \
|
| 57 |
-c 8192 \
|
|
|
|
| 36 |
# 1. TEXT: Qwen 2.5 Coder
|
| 37 |
download_model "Qwen/Qwen2.5-Coder-14B-Instruct-GGUF" "qwen2.5-coder-14b-instruct-q4_k_m.gguf"
|
| 38 |
|
| 39 |
+
# 2. IMAGE: Qwen 2.5 VL (correct case-sensitive filename)
|
| 40 |
download_model "ggml-org/Qwen2.5-VL-7B-Instruct-GGUF" "Qwen2.5-VL-7B-Instruct-Q4_K_M.gguf" "qwen2.5-vl-7b-instruct-q4_k_m.gguf"
|
| 41 |
|
| 42 |
# 3. AUDIO: Qwen 2 Audio
|
| 43 |
download_model "gaianet/Qwen2-Audio-7B-Instruct-GGUF" "Qwen2-Audio-7B-Instruct-Q4_K_M.gguf" "qwen2-audio-7b-instruct-q4_k_m.gguf"
|
| 44 |
|
| 45 |
echo "------------------------------------------------"
|
| 46 |
+
echo "🚀 Starting Server in Router Mode"
|
| 47 |
echo "------------------------------------------------"
|
| 48 |
|
| 49 |
+
# Start in ROUTER MODE - serve all models from /app/models
|
|
|
|
|
|
|
|
|
|
| 50 |
exec /usr/local/bin/llama-server \
|
| 51 |
+
--models-dir /app/models \
|
| 52 |
+
--models-max 3 \
|
| 53 |
--host 0.0.0.0 \
|
| 54 |
--port 7860 \
|
| 55 |
-c 8192 \
|