File size: 398 Bytes
# Image that serves the Qwen3-8B GGUF model (Q4_K_M file) with llama.cpp on port 7860.
#
# NOTE(review): ":full" is a moving tag; pin a dated tag or an image digest if
# reproducible builds matter.
FROM ghcr.io/ggml-org/llama.cpp:full

# wget performs the model download below; ca-certificates is listed explicitly
# because --no-install-recommends would otherwise not pull it in, and the
# download is over HTTPS. The package index is fetched, used and removed within
# a single layer so no stale apt lists are cached or shipped in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Bake the model weights into the image at build time so the container does not
# have to download them on start. dot:giga keeps the build log compact for a
# multi-gigabyte file.
# NOTE(review): the URL resolves the "main" branch and the file is not
# checksum-verified; consider pinning a revision and checking a sha256.
RUN wget --progress=dot:giga \
        "https://huggingface.co/Qwen/Qwen3-8B-GGUF/resolve/main/Qwen3-8B-Q4_K_M.gguf" \
        -O /Qwen3-8B-Q4_K_M.gguf

# Documentation only: the port passed to --port below.
EXPOSE 7860

# NOTE(review): no USER is set, so the process runs as whatever user the base
# image or the hosting platform selects — confirm that this is not root.

# No executable is named here: in exec form these are default arguments that
# Docker appends to the ENTRYPOINT inherited from the base image.
# Binding to 0.0.0.0 makes the server reachable from outside the container.
CMD ["--server", \
     "-m", "/Qwen3-8B-Q4_K_M.gguf", \
     "--port", "7860", \
     "--host", "0.0.0.0", \
     "--ctx-size", "32768", \
     "--n-predict", "-1", \
     "--threads", "2", \
     "--jinja"]