Update Dockerfile
Browse files- Dockerfile +9 -8
Dockerfile
CHANGED
|
@@ -17,8 +17,7 @@ RUN apt-get update && \
|
|
| 17 |
wget && \
|
| 18 |
rm -rf /var/lib/apt/lists/*
|
| 19 |
|
| 20 |
-
# Install Python dependencies
|
| 21 |
-
# Added hf_transfer for faster, more reliable downloads
|
| 22 |
# --no-cache-dir keeps pip's download cache out of the image layer; the extras
# spec is quoted so the shell never treats "[hf_transfer]" as a glob pattern.
RUN pip3 install --no-cache-dir "huggingface-hub[hf_transfer]" openai gradio duckduckgo-search
|
| 23 |
|
| 24 |
# Build llama.cpp
|
|
@@ -27,16 +26,18 @@ RUN git clone https://github.com/ggerganov/llama.cpp && \
|
|
| 27 |
cmake -B build -S . -DLLAMA_BUILD_SERVER=ON -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_BUILD_TYPE=Release && \
|
| 28 |
cmake --build build --config Release --target llama-server -j $(nproc)
|
| 29 |
|
| 30 |
-
# Download
|
|
|
|
| 31 |
RUN mkdir -p /models && \
|
| 32 |
HF_HUB_ENABLE_HF_TRANSFER=1 huggingface-cli download \
|
| 33 |
-
|
| 34 |
-
|
| 35 |
--local-dir /models \
|
| 36 |
-
--local-dir-use-symlinks False
|
| 37 |
-
|
|
|
|
|
|
|
| 38 |
|
| 39 |
-
# Copy app and startup script
|
| 40 |
# Application entry point.
COPY app.py /app.py
# Startup script; --chmod sets the executable bit at copy time, so no separate
# `RUN chmod` layer (which would store the file a second time) is needed.
# Requires a BuildKit-based builder.
COPY --chmod=755 start.sh /start.sh
|
|
|
|
| 17 |
wget && \
|
| 18 |
rm -rf /var/lib/apt/lists/*
|
| 19 |
|
| 20 |
+
# Install Python dependencies with transfer acceleration
|
|
|
|
| 21 |
# --no-cache-dir keeps pip's download cache out of the image layer; the extras
# spec is quoted so the shell never treats "[hf_transfer]" as a glob pattern.
RUN pip3 install --no-cache-dir "huggingface-hub[hf_transfer]" openai gradio duckduckgo-search
|
| 22 |
|
| 23 |
# Build llama.cpp
|
|
|
|
| 26 |
cmake -B build -S . -DLLAMA_BUILD_SERVER=ON -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_BUILD_TYPE=Release && \
|
| 27 |
cmake --build build --config Release --target llama-server -j $(nproc)
|
| 28 |
|
| 29 |
+
# Download from official Qwen GGUF repo
|
| 30 |
+
# We target the Q8_0 file for high precision
|
| 31 |
# Fetch the Q8_0 GGUF from Qwen/Qwen3-0.6B-GGUF and place it at the fixed path
# /models/model.gguf that the startup script expects.
#  - The include glob accepts both "q8_0" and "Q8_0": pattern filtering is
#    case-sensitive on Linux, so a lowercase-only glob downloads nothing when
#    the repo names its file with an uppercase quant tag.
#    NOTE(review): confirm the exact filename in the repo.
#  - Download and rename happen in one RUN so the model is stored in a single
#    layer; renaming in a later layer would keep a second full copy in the image.
#  - The build fails loudly if no .gguf file was fetched, instead of producing
#    an image without a model.
RUN mkdir -p /models && \
    HF_HUB_ENABLE_HF_TRANSFER=1 huggingface-cli download \
        Qwen/Qwen3-0.6B-GGUF \
        --include "*[Qq]8_0.gguf" \
        --local-dir /models \
        --local-dir-use-symlinks False && \
    model_file="$(find /models -type f -name '*.gguf' -print -quit)" && \
    if [ -z "$model_file" ]; then \
        echo "No GGUF file matched the download pattern" >&2; \
        exit 1; \
    fi && \
    mv "$model_file" /models/model.gguf
|
| 40 |
|
|
|
|
| 41 |
# Application entry point.
COPY app.py /app.py
# Startup script; --chmod sets the executable bit at copy time, so no separate
# `RUN chmod` layer (which would store the file a second time) is needed.
# Requires a BuildKit-based builder.
COPY --chmod=755 start.sh /start.sh
|