anews9340 committed on
Commit
c4c2b5b
·
verified ·
1 Parent(s): 7e4778c

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +3 -3
Dockerfile CHANGED
@@ -45,11 +45,11 @@ RUN git clone --depth 1 https://github.com/ggerganov/llama.cpp.git . && \
45
  ENTRYPOINT ["./build/bin/llama-server"]
46
 
47
  CMD [ \
48
- "-hf", "unsloth/Qwen3.5-9B-GGUF:Q8_0", \
49
  "--host", "0.0.0.0", \
50
  "--port", "7860", \
51
  "-t", "8", \
52
  "-c", "4096", \
53
- "--flash-attn", "true"
54
- "--no-mmap" \
55
  ]
 
45
  ENTRYPOINT ["./build/bin/llama-server"]
46
 
47
  CMD [ \
48
+ "-hf", "unsloth/Qwen3.5-4B-GGUF:Q8_0", \
49
  "--host", "0.0.0.0", \
50
  "--port", "7860", \
51
  "-t", "8", \
52
  "-c", "4096", \
53
+ "--flash-attn", "true", \
54
+ "--no-mmap"
55
  ]