# Spaces:
# Running
# Running
# File size: 698 Bytes
# Serves a GGUF model with the llama.cpp server, listening on port 7860.
# The base image is pinned by digest so rebuilds always start from the same bits.
FROM ghcr.io/ggml-org/llama.cpp:server@sha256:a9b230ae078a6dd947ede5825f227af9fc5fc9e126c4717bebd4762c02601285

# Create an unprivileged account with a fixed UID (1000) and switch to it for
# every following instruction and for the running container.
RUN useradd -m -u 1000 user
USER user
ENV HOME=/home/user \
    PATH=/home/user/.local/bin:$PATH
WORKDIR /app

# Download the model weights at build time and store them as /app/model.gguf,
# owned by the unprivileged user.
# NOTE(review): this URL follows the mutable `main` ref and the download is not
# integrity-checked. Pin a specific revision and add `--checksum=sha256:<digest>`
# once the digest of the intended file is known.
ADD --chown=user https://huggingface.co/Intel/Qwen3-Coder-30B-A3B-Instruct-gguf-q2ks-mixed-AutoRound/resolve/main/Qwen3-Coder-30B-A3B-Instruct-128x1.8B-Q2_K_S.gguf /app/model.gguf

# Documentation only: the port the server is told to listen on in CMD below.
EXPOSE 7860

# The server is moved to port 7860 below, so the health probe must target that
# port as well.
# NOTE(review): the upstream llama.cpp server image is understood to declare a
# HEALTHCHECK against localhost:8080 and to ship curl; without this override the
# inherited probe would never succeed. Confirm against the pinned digest.
# The generous start period leaves time for the model to be loaded.
HEALTHCHECK --interval=30s --timeout=5s --start-period=5m --retries=3 \
    CMD ["curl", "-f", "http://localhost:7860/health"]

# Default arguments only; no ENTRYPOINT is set here, so these are presumably
# appended to the entrypoint inherited from the base image.
CMD ["--port", "7860", "--no-mmap", "--flash-attn", "on", "--fit", "on", "--ctx-size", "8192", "--samplers", "min_p", "--min-p", "0.005", "--backend-sampling", "--webui-mcp-proxy", "-m", "/app/model.gguf", "--chat-template-kwargs", "{ \"enable_thinking\": false }", "--no-mmproj"]