File size: 471 Bytes
adeb19d
 
368cf1c
 
2f08f4c
 
d0791b8
368cf1c
 
0906be4
d0791b8
2f08f4c
1
2
3
4
5
6
7
8
9
10
11
12
13
# Base image: the llama.cpp "server" image published under ggml-org on GHCR.
# NOTE(review): ":server" looks like a moving tag; consider pinning a specific
# build tag or an @sha256 digest so rebuilds are reproducible.
FROM ghcr.io/ggml-org/llama.cpp:server

# Working directory; the downloaded model files and the llama-server binary
# referenced later in this file all use /app paths.
WORKDIR /app

# Download the two GGUF files at build time so the image is self-contained:
#   - gemma-3-4b-it-Q4_K_M.gguf : the model file handed to llama-server via -m
#   - mmproj-model-f16.gguf     : the projector file handed to it via --mmproj
#
# --chmod=644: files fetched by ADD from a URL are created with mode 600, which
# makes them unreadable when the container is started under a non-root UID.
# 644 keeps them world-readable while still not writable by the runtime user.
#
# NOTE(review): both URLs resolve against the "main" branch, so the content can
# change between builds. Once the expected digests are confirmed, pin a
# revision and add --checksum=sha256:<digest> to each ADD.
ADD --chmod=644 https://huggingface.co/ggml-org/gemma-3-4b-it-GGUF/resolve/main/gemma-3-4b-it-Q4_K_M.gguf /app/gemma-3-4b-it-Q4_K_M.gguf
ADD --chmod=644 https://huggingface.co/ggml-org/gemma-3-4b-it-GGUF/resolve/main/mmproj-model-f16.gguf /app/mmproj-model-f16.gguf

# Port the server listens on (see --port in CMD). EXPOSE is documentation only;
# publishing the port is still up to the runtime.
EXPOSE 7860

# Probe the server on the port actually configured in CMD, so orchestrators can
# tell when the model has finished loading and when the process is wedged.
# --start-period gives the model time to load before failures are counted.
# NOTE(review): assumes curl is present in the base image and that any
# HEALTHCHECK inherited from it targets a different port than 7860; confirm
# against the base image's Dockerfile.
HEALTHCHECK --interval=30s --timeout=5s --start-period=120s --retries=3 \
    CMD ["curl", "-fsS", "http://localhost:7860/health"]

# ENTRYPOINT is the server binary; CMD supplies the default arguments, so they
# can be replaced wholesale at `docker run` time without touching the binary.
ENTRYPOINT ["/app/llama-server"]

# Default arguments: listen on all interfaces on port 7860, load the model
# file, and attach the projector file downloaded above into /app.
CMD ["--host", "0.0.0.0", \
     "--port", "7860", \
     "-m", "/app/gemma-3-4b-it-Q4_K_M.gguf", \
     "--mmproj", "/app/mmproj-model-f16.gguf"]