gpt

Runtime error

Xlnk committed on Jan 19

Commit

6ea5e99

verified ·

1 Parent(s): 2e44ca0

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -3,7 +3,6 @@ FROM ubuntu:22.04
 ENV DEBIAN_FRONTEND=noninteractive
 WORKDIR /app
-# Dependencies
 RUN apt update && apt install -y \
     git \
     cmake \
@@ -12,24 +11,22 @@ RUN apt update && apt install -y \
     ca-certificates \
     && rm -rf /var/lib/apt/lists/*
-# Clone llama.cpp
 RUN git clone https://github.com/ggerganov/llama.cpp
-# Build llama-server (SINGLE THREAD – SAFE)
 RUN cmake -S llama.cpp -B llama.cpp/build \
     -DLLAMA_BUILD_SERVER=ON \
     -DCMAKE_BUILD_TYPE=Release \
     && cmake --build llama.cpp/build --target llama-server
-    # ⚠️ no -j$(nproc)
-# Models
 RUN mkdir -p /models
-# TinyLlama 1.1B (recommended for HF CPU)
-RUN curl -L -o /models/model.gguf \
 https://huggingface.co/TheBloke/TinyLlama-1.1B-Chat-GGUF/resolve/main/tinyllama-1.1b-chat-q4_k_m.gguf
-# Start script
 COPY start.sh /start.sh
 RUN chmod +x /start.sh

 ENV DEBIAN_FRONTEND=noninteractive
 WORKDIR /app
 RUN apt update && apt install -y \
     git \
     cmake \
     ca-certificates \
     && rm -rf /var/lib/apt/lists/*
 RUN git clone https://github.com/ggerganov/llama.cpp
 RUN cmake -S llama.cpp -B llama.cpp/build \
     -DLLAMA_BUILD_SERVER=ON \
     -DCMAKE_BUILD_TYPE=Release \
     && cmake --build llama.cpp/build --target llama-server
 RUN mkdir -p /models
+# Download the TinyLlama 1.1B chat model (Q4_K_M quantization) from Hugging Face.
+# --fail makes curl exit non-zero on an HTTP error, so an error page is never
+# saved as the model file.
+RUN curl -L --fail -o /models/model.gguf \
 https://huggingface.co/TheBloke/TinyLlama-1.1B-Chat-GGUF/resolve/main/tinyllama-1.1b-chat-q4_k_m.gguf
+# Verify the download: a GGUF file begins with the 4-byte ASCII magic "GGUF".
+# Unlike piping the bytes to a hex dump (which only prints them), `test` fails
+# the build on a mismatch and needs no extra package such as xxd.
+RUN test "$(head -c 4 /models/model.gguf)" = "GGUF"
 COPY start.sh /start.sh
 RUN chmod +x /start.sh