kiddoos committed on
Commit
adeb19d
·
1 Parent(s): 368cf1c

update application file

Browse files
Files changed (1) hide show
  1. Dockerfile +5 -3
Dockerfile CHANGED
@@ -1,8 +1,10 @@
1
- FROM vllm/vllm-openai:latest
 
 
2
 
3
  WORKDIR /app
4
 
5
  EXPOSE 7860
6
 
7
- ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]
8
- CMD ["--model", "google/gemma-3-4b-it", "--host", "0.0.0.0", "--port", "7860", "--trust-remote-code"]
 
1
+ FROM ghcr.io/ggml-org/llama.cpp:server
2
+
3
+ ADD https://huggingface.co/unsloth/gemma-3-4b-it-GGUF/resolve/main/gemma-3-4b-it-Q8_0.gguf /gemma3-4b.gguf
4
 
5
  WORKDIR /app
6
 
7
  EXPOSE 7860
8
 
9
+ ENTRYPOINT ["/llama-server"]
10
+ CMD ["-m", "/gemma3-4b.gguf", "--host", "0.0.0.0", "--port", "7860", "-n", "-1"]