CooLLaMACEO committed on
Commit
5b14eba
·
verified ·
1 Parent(s): 2142f68

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +8 -8
Dockerfile CHANGED
@@ -2,21 +2,21 @@ FROM python:3.10-slim
2
 
3
  WORKDIR /app
4
 
5
- # 1. Install wget
6
  RUN apt-get update && apt-get install -y wget && rm -rf /var/lib/apt/lists/*
7
 
8
- # 2. Install pre-built llama-cpp (NO BUILDING HANGS)
9
- RUN pip install --no-cache-dir \
10
- fastapi \
11
- uvicorn \
12
  --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu \
13
- llama-cpp-python
14
 
15
- # 3. Download MPT-7B Q2 as 'model.gguf' (Matches your script)
16
  RUN wget -q -O model.gguf \
17
  "https://huggingface.co/maddes8cht/mosaicml-mpt-7b-chat-gguf/resolve/main/mosaicml-mpt-7b-chat-Q2_K.gguf?download=true"
18
 
19
- # 4. Copy the script you found
20
  COPY app.py .
21
 
22
  EXPOSE 7860
 
2
 
3
  WORKDIR /app
4
 
5
+ # 1. Install wget (essential for the model)
6
  RUN apt-get update && apt-get install -y wget && rm -rf /var/lib/apt/lists/*
7
 
8
+ # 2. Install llama-cpp-python FORCING the binary (No compilation allowed)
9
+ # We use version 0.2.76 as it is highly stable for MPT models
10
+ RUN pip install --no-cache-dir fastapi uvicorn
11
+ RUN pip install llama-cpp-python==0.2.76 \
12
  --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu \
13
+ --prefer-binary
14
 
15
+ # 3. Download the model silently
16
  RUN wget -q -O model.gguf \
17
  "https://huggingface.co/maddes8cht/mosaicml-mpt-7b-chat-gguf/resolve/main/mosaicml-mpt-7b-chat-Q2_K.gguf?download=true"
18
 
19
+ # 4. Copy your script
20
  COPY app.py .
21
 
22
  EXPOSE 7860