File size: 238 Bytes
b24e544
 
 
 
 
 
208f694
 
 
4c84370
b4e7f48
4c84370
 
1
2
3
4
5
6
7
8
9
10
11
12
13
#!/bin/bash
#
# Launch the llama.cpp HTTP server (llama-server) for the model stored at
# /models/model.gguf, listening on 0.0.0.0:7860.
#
# Takes no arguments. The exit status is that of llama-server (or non-zero
# if nproc fails or the binary cannot be executed).

set -euo pipefail

# Resolve the thread count up front so that a failing nproc aborts the
# script instead of silently producing a malformed command line.
threads="$(nproc)"

# Arguments are kept in an array so each value stays a single word.
# NOTE(review): flag meanings below follow `llama-server --help`; confirm
# against the llama.cpp version actually installed in /app/llama.cpp.
server_args=(
  --model /models/model.gguf
  --host 0.0.0.0          # bind on all interfaces
  --port 7860
  --fit off
  --threads "${threads}"  # one thread per processor reported by nproc
  --mlock
  --no-mmap
  -c 262144               # context size
  --rope-scaling yarn
  --rope-scale 16
)

# exec replaces this shell with the server process, so signals sent to the
# script's PID (e.g. SIGTERM on container stop) reach llama-server directly.
exec /app/llama.cpp/build/bin/llama-server "${server_args[@]}"