Spaces:
Sleeping
Sleeping
Create Dockerfile
Browse files- Dockerfile +10 -0
Dockerfile
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Full (non-slim) Python base image.
# NOTE(review): presumably kept because installing llama-cpp-python may need a
# C/C++ toolchain at build time - confirm before switching to a -slim variant.
FROM python:3.10

# Keep the downloaded model and the server's working directory out of the
# filesystem root; the relative paths used later (--local-dir . and the
# --model file name) resolve against this directory.
WORKDIR /app
|
| 2 |
+
|
| 3 |
+
# Install llama-cpp-python (server for GGUF models)
|
| 4 |
+
# The extras requirement is quoted so the shell can never treat "[server]" as
# a glob pattern. Packages are listed one per line, sorted, for cleaner diffs.
# NOTE(review): both packages are unpinned; pin exact versions for
# reproducible builds.
RUN pip install --no-cache-dir \
      huggingface_hub \
      "llama-cpp-python[server]"
|
| 5 |
+
|
| 6 |
+
# Download the model (Qwen2.5-Coder-7B-Instruct, Q4_K_M quantization - approx. 5 GB)
|
| 7 |
+
# Fetch a single GGUF file from the Hugging Face Hub into the current directory.
# Uses the `hf` entry point, which supersedes the deprecated `huggingface-cli`,
# and omits the deprecated --local-dir-use-symlinks flag.
# NOTE(review): current huggingface_hub releases are expected to write
# --local-dir downloads as regular files - confirm against the version installed.
RUN hf download bartowski/Qwen2.5-Coder-7B-Instruct-GGUF \
      Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf \
      --local-dir .
|
| 8 |
+
|
| 9 |
+
# Start the OpenAI-compatible API server
|
| 10 |
+
# Document the port the server listens on (must match --port in CMD).
# EXPOSE does not publish the port; it only records the contract.
EXPOSE 7860

# Exec-form CMD: the Python process is started directly, without a shell.
# The server loads the GGUF file by a path relative to the working directory
# and binds to 0.0.0.0 so it accepts connections on all interfaces.
CMD ["python3", "-m", "llama_cpp.server", "--model", "Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf", "--host", "0.0.0.0", "--port", "7860"]
|