James040 committed on
Commit
aee66c6
·
verified ·
1 Parent(s): 7f98ba3

Update start.sh

Browse files
Files changed (1) hide show
  1. start.sh +7 -10
start.sh CHANGED
@@ -2,21 +2,18 @@
2
  set -e
3
 
4
  echo "Starting llama.cpp server..."
5
- # Direct path for the ghcr.io/ggml-org/llama.cpp:full image
6
- LLAMA_BIN="/app/llama-server"
7
-
8
- $LLAMA_BIN \
9
  -m /app/SmolLM2-1.7B-Instruct-Q4_K_M.gguf \
10
  --host 0.0.0.0 \
11
  --port 8080 \
12
  -t 2 \
13
- -c 4096 \
14
- -n 2048 \
15
  --log-disable &
16
 
17
- echo "Waiting for llama.cpp to be ready..."
18
- sleep 15
19
 
20
- echo "Starting Gradio app using venv..."
21
- # Use the full path to the venv python to be 100% sure
22
  /opt/venv/bin/python3 /app/app.py
 
2
  set -e
3
 
4
  echo "Starting llama.cpp server..."
5
+ # The binary is located at /app/llama-server in the ggml-org/llama.cpp image
6
+ /app/llama-server \
 
 
7
  -m /app/SmolLM2-1.7B-Instruct-Q4_K_M.gguf \
8
  --host 0.0.0.0 \
9
  --port 8080 \
10
  -t 2 \
11
+ -c 2048 \
 
12
  --log-disable &
13
 
14
+ echo "Waiting for server to initialize..."
15
+ sleep 10
16
 
17
+ echo "Starting Gradio App..."
18
+ # Explicitly use the venv's python
19
  /opt/venv/bin/python3 /app/app.py