Spaces:
Sleeping
Sleeping
Update start.sh
Browse files
start.sh
CHANGED
|
@@ -2,21 +2,18 @@
|
|
| 2 |
set -e
|
| 3 |
|
| 4 |
echo "Starting llama.cpp server..."
|
| 5 |
-
#
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
$LLAMA_BIN \
|
| 9 |
-m /app/SmolLM2-1.7B-Instruct-Q4_K_M.gguf \
|
| 10 |
--host 0.0.0.0 \
|
| 11 |
--port 8080 \
|
| 12 |
-t 2 \
|
| 13 |
-
-c
|
| 14 |
-
-n 2048 \
|
| 15 |
--log-disable &
|
| 16 |
|
| 17 |
-
echo "Waiting for
|
| 18 |
-
sleep
|
| 19 |
|
| 20 |
-
echo "Starting Gradio
|
| 21 |
-
#
|
| 22 |
/opt/venv/bin/python3 /app/app.py
|
|
|
|
| 2 |
set -e
|
| 3 |
|
| 4 |
echo "Starting llama.cpp server..."
|
| 5 |
+
# The binary is located at /app/llama-server in the ggml-org/llama.cpp image
|
| 6 |
+
/app/llama-server \
|
|
|
|
|
|
|
| 7 |
-m /app/SmolLM2-1.7B-Instruct-Q4_K_M.gguf \
|
| 8 |
--host 0.0.0.0 \
|
| 9 |
--port 8080 \
|
| 10 |
-t 2 \
|
| 11 |
+
-c 2048 \
|
|
|
|
| 12 |
--log-disable &
|
| 13 |
|
| 14 |
+
echo "Waiting for server to initialize..."
|
| 15 |
+
sleep 10
|
| 16 |
|
| 17 |
+
echo "Starting Gradio App..."
|
| 18 |
+
# Explicitly use the venv's python
|
| 19 |
/opt/venv/bin/python3 /app/app.py
|