QJMKWB committed on
Commit
99b3bba
·
verified ·
1 Parent(s): 962cced

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -8
Dockerfile CHANGED
@@ -20,17 +20,16 @@ WORKDIR $HOME/app
20
  RUN pip install --no-cache-dir --upgrade pip
21
  RUN pip install --no-cache-dir huggingface_hub llama-cpp-python[server]
22
 
23
- # Sťahovanie modelu - OPRAVENÝ PRÍKAZ
24
- # Používame --include na špecifikáciu konkrétneho GGUF súboru
25
  RUN huggingface-cli download bartowski/Qwen2.5-Coder-7B-Instruct-GGUF \
26
- Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf \
27
- --local-dir . \
28
- --local-dir-use-symlinks False
29
 
30
- # Spustenie servera
31
- # Pridaný parameter --n_ctx pre kontextové okno (uprav podľa RAM v Space)
32
  CMD ["python3", "-m", "llama_cpp.server", \
33
- "--model", "Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf", \
34
  "--host", "0.0.0.0", \
35
  "--port", "7860", \
 
36
  "--chat_format", "chatml"]
 
20
  RUN pip install --no-cache-dir --upgrade pip
21
  RUN pip install --no-cache-dir huggingface_hub llama-cpp-python[server]
22
 
23
+
24
+ # Zmeň v kroku 3 na:
25
  RUN huggingface-cli download bartowski/Qwen2.5-Coder-7B-Instruct-GGUF \
26
+ Qwen2.5-Coder-7B-Instruct-Q8_0.gguf \
27
+ --local-dir . --local-dir-use-symlinks False
 
28
 
29
+ # Zmeň v kroku 4 (CMD) na:
 
30
  CMD ["python3", "-m", "llama_cpp.server", \
31
+ "--model", "Qwen2.5-Coder-7B-Instruct-Q8_0.gguf", \
32
  "--host", "0.0.0.0", \
33
  "--port", "7860", \
34
+ "--n_ctx", "8192", \
35
  "--chat_format", "chatml"]