QJMKWB committed on
Commit
b6fa1e4
·
verified ·
1 Parent(s): 668cee6

Create Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +10 -0
Dockerfile ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.10
2
+
3
+ # Install llama-cpp-python with its server extra (serves GGUF models) and huggingface_hub (provides huggingface-cli)
4
+ RUN pip install --no-cache-dir "llama-cpp-python[server]" huggingface_hub
5
+
6
+ # Download the model (Qwen2.5-Coder-7B-Instruct, Q4_K_M quantization - approx. 5 GB) into the current directory
6
+ RUN huggingface-cli download bartowski/Qwen2.5-Coder-7B-Instruct-GGUF Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf --local-dir .
8
+
9
+ # Start the OpenAI-compatible API server for the downloaded model, listening on all interfaces on port 7860
10
+ CMD ["python3", "-m", "llama_cpp.server", "--model", "Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf", "--host", "0.0.0.0", "--port", "7860"]