gpt

Runtime error

Xlnk committed on Jan 19

Commit

89b549f

verified ·

1 Parent(s): fd21230

Create Dockerfile

Files changed (1) hide show

Dockerfile ADDED Viewed

+FROM ubuntu:22.04
+# Build-time only: stops apt from prompting during the build without
+# leaving DEBIAN_FRONTEND set in the running container's environment.
+ARG DEBIAN_FRONTEND=noninteractive
+WORKDIR /app
+# Install the build toolchain (build-essential, cmake), git for fetching
+# sources, and curl + ca-certificates for HTTPS downloads.
+# apt-get is used because apt's CLI is not stable for scripted use;
+# --no-install-recommends keeps optional packages out of the image.
+# The apt lists are removed in the same layer so they never persist.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential \
+    ca-certificates \
+    cmake \
+    curl \
+    git \
+    && rm -rf /var/lib/apt/lists/*
+# Clone llama.cpp into /app/llama.cpp (relative to WORKDIR).
+# --depth 1 fetches only the latest commit, since the history is not needed
+# to compile and would only enlarge this layer.
+# NOTE(review): if the build embeds git-derived version info, a shallow
+# clone may change what it reports — confirm this is acceptable.
+RUN git clone --depth 1 https://github.com/ggerganov/llama.cpp
+# Build llama-server
+# Configure an out-of-tree Release build with the server enabled, then
+# compile only the llama-server target using every available core.
+RUN cmake -S llama.cpp -B llama.cpp/build \
+    -DLLAMA_BUILD_SERVER=ON \
+    -DCMAKE_BUILD_TYPE=Release \
+    && cmake --build llama.cpp/build --target llama-server -j"$(nproc)"
+# Create the model directory and download a GGUF model (example: Qwen 0.5B)
+# in a single layer.
+# --fail makes curl exit non-zero on an HTTP error (404, 401, ...), so the
+# build stops instead of silently saving the error page as model.gguf and
+# failing later at runtime. --retry covers transient network errors.
+# mkdir is used rather than curl's --create-dirs, which would create the
+# directory with restrictive 0750 permissions.
+RUN mkdir -p /models \
+    && curl --fail --location --retry 3 \
+        --output /models/model.gguf \
+        https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct-GGUF/resolve/main/qwen2.5-0.5b-instruct-q4_k_m.gguf
+# Copy start script
+# NOTE(review): start.sh is not shown here; it presumably launches the
+# llama-server binary built above against /models/model.gguf — confirm.
+COPY start.sh /start.sh
+# Ensure the script is executable so the exec-form CMD below can run it directly.
+RUN chmod +x /start.sh
+# Documents the port the container is expected to listen on; EXPOSE alone
+# does not publish it. NOTE(review): verify start.sh binds to 7860.
+EXPOSE 7860
+# Exec (JSON-array) form: /start.sh is executed directly, not via /bin/sh -c.
+CMD ["/start.sh"]