Spaces:
Sleeping
Sleeping
Update Dockerfile
Browse files - Dockerfile +12 -2
Dockerfile
CHANGED
|
@@ -2,8 +2,18 @@ FROM ghcr.io/ggml-org/llama.cpp:server
|
|
| 2 |
|
| 3 |
ENV LLAMA_CACHE=/tmp/llama-cache
|
| 4 |
ENV HF_HUB_CACHE=/tmp/hf-cache
|
| 5 |
-
ENV LLAMA_ARG_WEBUI=1
|
| 6 |
|
| 7 |
EXPOSE 7860
|
| 8 |
|
| 9 |
-
CMD ["-hf", "unsloth/gemma-4-E2B-it-GGUF:Q4_0",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
|
| 3 |
ENV LLAMA_CACHE=/tmp/llama-cache
|
| 4 |
ENV HF_HUB_CACHE=/tmp/hf-cache
|
|
|
|
| 5 |
|
| 6 |
EXPOSE 7860
|
| 7 |
|
| 8 |
+
CMD ["-hf", "unsloth/gemma-4-E2B-it-GGUF:Q4_0", \
|
| 9 |
+
"-c", "2048", \
|
| 10 |
+
"-t", "8", \
|
| 11 |
+
"-tb", "16", \
|
| 12 |
+
"-b", "1024", \
|
| 13 |
+
"-ub", "512", \
|
| 14 |
+
"-np", "1", \
|
| 15 |
+
"--flash-attn", \
|
| 16 |
+
"--no-warmup", \
|
| 17 |
+
"--no-context-shift", \
|
| 18 |
+
"--host", "0.0.0.0", \
|
| 19 |
+
"--port", "7860"]
|