owlninjam committed on
Commit
e366f1f
·
verified ·
1 Parent(s): 575e1e8

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +13 -9
Dockerfile CHANGED
@@ -2,26 +2,30 @@ FROM python:3.11-slim
2
 
3
  WORKDIR /app
4
 
5
- # Install dependencies
6
  RUN apt-get update && apt-get install -y \
7
- build-essential wget git cmake \
8
  && rm -rf /var/lib/apt/lists/*
9
 
10
  # Clone llama.cpp
11
  RUN git clone https://github.com/ggerganov/llama.cpp
12
 
13
- # Build with cmake
14
  WORKDIR /app/llama.cpp
15
- RUN cmake -B build && cmake --build build --config Release
16
 
17
- # Go back to /app
18
  WORKDIR /app
19
 
20
- # Copy app files
21
  COPY app.py .
22
 
23
- # Expose port
 
 
 
 
24
  EXPOSE 7860
25
 
26
- # Run app
27
- CMD ["python", "app.py"]
 
# syntax=docker/dockerfile:1
FROM python:3.11-slim

WORKDIR /app

# Build dependencies for llama.cpp with HTTP server support.
# libcurl4-openssl-dev is required by -DLLAMA_CURL=ON below;
# ca-certificates is needed for the HTTPS model download;
# --no-install-recommends keeps the layer small (hadolint DL3015);
# the apt list cleanup runs in the SAME layer so it actually shrinks the image.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        cmake \
        git \
        libcurl4-openssl-dev \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Clone llama.cpp. LLAMA_CPP_REF defaults to the upstream default branch
# (original behavior); override at build time with a release tag
# (e.g. --build-arg LLAMA_CPP_REF=b4458) for reproducible builds.
# --depth 1 avoids pulling the full history.
ARG LLAMA_CPP_REF=master
RUN git clone --branch "${LLAMA_CPP_REF}" --depth 1 \
        https://github.com/ggerganov/llama.cpp

# Build llama.cpp with CURL enabled; -j "$(nproc)" parallelizes the build.
WORKDIR /app/llama.cpp
RUN cmake -B build -DLLAMA_CURL=ON \
    && cmake --build build --config Release -j "$(nproc)"

# Back to /app
WORKDIR /app

# Copy the Python app (kept for compatibility; the CMD below starts
# llama-server directly, not app.py).
COPY app.py .

# Bake the model into the image (multi-GB layer).
# NOTE(review): no checksum verification on this download — consider
# `ADD --checksum=sha256:...` or fetching at runtime into a volume instead;
# TODO confirm the trade-off is acceptable for this deployment.
RUN wget -O /app/model.gguf \
    https://huggingface.co/TheBloke/CapybaraHermes-2.5-Mistral-7B-GGUF/resolve/main/capybarahermes-2.5-mistral-7b.Q5_K_M.gguf

# Drop root: the server only needs read access to the model and binary,
# and 7860 is an unprivileged port. Stable numeric UID for runtimes that
# enforce runAsNonRoot.
RUN useradd --system --uid 10001 --home /app app
USER app

# llama.cpp HTTP server port (documentation only; publish with -p at run time).
EXPOSE 7860

# Exec-form CMD so llama-server runs as PID 1 and receives SIGTERM on stop.
CMD ["/app/llama.cpp/build/bin/llama-server", "-m", "/app/model.gguf", "-c", "2048", "-t", "2", "--host", "0.0.0.0", "--port", "7860"]