OrbitMC committed on
Commit
8450b02
·
verified ·
1 Parent(s): f082b76

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +9 -8
Dockerfile CHANGED
@@ -17,8 +17,7 @@ RUN apt-get update && \
17
  wget && \
18
  rm -rf /var/lib/apt/lists/*
19
 
20
- # Install Python dependencies
21
- # Added hf_transfer for faster, more reliable downloads
22
  RUN pip3 install huggingface-hub[hf_transfer] openai gradio duckduckgo-search
23
 
24
  # Build llama.cpp
@@ -27,16 +26,18 @@ RUN git clone https://github.com/ggerganov/llama.cpp && \
27
  cmake -B build -S . -DLLAMA_BUILD_SERVER=ON -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_BUILD_TYPE=Release && \
28
  cmake --build build --config Release --target llama-server -j $(nproc)
29
 
30
- # Download model using huggingface-cli (more stable than wget)
 
31
  RUN mkdir -p /models && \
32
  HF_HUB_ENABLE_HF_TRANSFER=1 huggingface-cli download \
33
- unsloth/Qwen3-0.6B-GGUF \
34
- Qwen3-0.6B-UD-Q8_K_XL.gguf \
35
  --local-dir /models \
36
- --local-dir-use-symlinks False && \
37
- mv /models/Qwen3-0.6B-UD-Q8_K_XL.gguf /models/model.q8_k_xl.gguf
 
 
38
 
39
- # Copy app and startup script
40
  COPY app.py /app.py
41
  COPY start.sh /start.sh
42
  RUN chmod +x /start.sh
 
17
  wget && \
18
  rm -rf /var/lib/apt/lists/*
19
 
20
+ # Install Python dependencies; the hf_transfer extra enables faster Hugging Face downloads
 
21
  RUN pip3 install huggingface-hub[hf_transfer] openai gradio duckduckgo-search
22
 
23
  # Build llama.cpp
 
26
  cmake -B build -S . -DLLAMA_BUILD_SERVER=ON -DGGML_BLAS=ON -DGGML_BLAS_VENDOR=OpenBLAS -DCMAKE_BUILD_TYPE=Release && \
27
  cmake --build build --config Release --target llama-server -j $(nproc)
28
 
29
+ # Download from official Qwen GGUF repo
30
+ # We target the Q8_0 file for high precision
31
  RUN mkdir -p /models && \
32
  HF_HUB_ENABLE_HF_TRANSFER=1 huggingface-cli download \
33
+ Qwen/Qwen3-0.6B-GGUF \
34
+ --include "*q8_0.gguf" \
35
  --local-dir /models \
36
+ --local-dir-use-symlinks False
37
+
38
+ # Rename the file to a standard name for our startup script
39
+ RUN find /models -name "*.gguf" -exec mv {} /models/model.gguf \;
40
 
 
41
  COPY app.py /app.py
42
  COPY start.sh /start.sh
43
  RUN chmod +x /start.sh