Duplicated from Xlnk/gpt
902996c 5038df1 9777610
1
2
3
4
5
6
7
8
9
10
#!/bin/bash
# Launch the llama.cpp server binary against /models/model.gguf.
#
# Flags passed to llama-server:
#   --model /models/model.gguf
#   --host 0.0.0.0, --port 7860
#   --fit off
#   --threads <output of nproc>
#   --mlock, --no-mmap
#
# Requires: /app/llama.cpp/build/bin/llama-server and nproc on PATH.
set -euo pipefail

# Resolve the thread count up front so that a failing nproc aborts the script
# (via set -e) instead of handing an empty --threads value to the server.
threads="$(nproc)"

# Keep the flags in an array: one option per line, no fragile trailing
# backslashes, and every value is passed as exactly one word.
server_args=(
  --model /models/model.gguf
  --host 0.0.0.0
  --port 7860
  --fit off
  --threads "${threads}"
  --mlock
  --no-mmap
  # NOTE(review): the original command ended with a dangling "\" after
  # --no-mmap. If further flags were intended, append them here — confirm.
)

# exec replaces this shell with the server process, so signals sent to the
# script's PID are delivered to llama-server directly.
exec /app/llama.cpp/build/bin/llama-server "${server_args[@]}"