Download model during build
Browse files- Dockerfile +5 -1
Dockerfile
CHANGED
|
@@ -10,6 +10,7 @@ RUN apt-get update && apt-get install -y \
|
|
| 10 |
curl \
|
| 11 |
pkg-config \
|
| 12 |
git \
|
|
|
|
| 13 |
&& rm -rf /var/lib/apt/lists/*
|
| 14 |
|
| 15 |
# Install Python deps — compile llama-cpp-python with OpenBLAS
|
|
@@ -18,12 +19,15 @@ RUN CMAKE_ARGS="-DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS" \
|
|
| 18 |
FORCE_CMAKE=1 \
|
| 19 |
pip install --no-cache-dir -r requirements.txt
|
| 20 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 21 |
COPY app.py .
|
| 22 |
|
| 23 |
# HuggingFace Spaces expects port 7860
|
| 24 |
EXPOSE 7860
|
| 25 |
|
| 26 |
-
# Set SPACE_URL at runtime via HF Space secrets/env vars
|
| 27 |
ENV SPACE_URL=""
|
| 28 |
ENV N_CTX="4096"
|
| 29 |
ENV N_THREADS="2"
|
|
|
|
| 10 |
curl \
|
| 11 |
pkg-config \
|
| 12 |
git \
|
| 13 |
+
wget \
|
| 14 |
&& rm -rf /var/lib/apt/lists/*
|
| 15 |
|
| 16 |
# Install Python deps — compile llama-cpp-python with OpenBLAS
|
|
|
|
| 19 |
FORCE_CMAKE=1 \
|
| 20 |
pip install --no-cache-dir -r requirements.txt
|
| 21 |
|
| 22 |
+
# Download the model during build
|
| 23 |
+
RUN mkdir -p /app/models && \
|
| 24 |
+
wget -q https://huggingface.co/unsloth/gemma-4-26B-A4B-it-GGUF/resolve/main/gemma-4-26B-A4B-it-UD-IQ3_XXS.gguf -O /app/models/gemma-4-26B-A4B-it-UD-IQ3_XXS.gguf
|
| 25 |
+
|
| 26 |
COPY app.py .
|
| 27 |
|
| 28 |
# HuggingFace Spaces expects port 7860
|
| 29 |
EXPOSE 7860
|
| 30 |
|
|
|
|
| 31 |
ENV SPACE_URL=""
|
| 32 |
ENV N_CTX="4096"
|
| 33 |
ENV N_THREADS="2"
|