CooLLaMACEO committed on
Commit
ad08817
·
verified ·
1 Parent(s): 0122415

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +13 -10
Dockerfile CHANGED
@@ -2,26 +2,29 @@ FROM python:3.10-slim
2
 
3
  WORKDIR /app
4
 
5
- # Install wget and build tools
6
  RUN apt-get update && apt-get install -y \
7
  wget \
8
- git \
9
  && rm -rf /var/lib/apt/lists/*
10
 
11
- # Install Python dependencies
12
  RUN pip install --no-cache-dir \
13
  fastapi \
14
- uvicorn[standard] \
15
- torch \
16
- transformers
17
 
18
- # Download model (example GGUF from Hugging Face)
19
- RUN wget -q -O mpt-7b-q2.gguf \
20
- "https://huggingface.co/maddes8cht/mosaicml-mpt-7b-chat-gguf/resolve/main/mosaicml-mpt-7b-chat-Q2_K.gguf?download=true"
 
21
 
22
- # Copy app
23
  COPY app.py .
24
 
 
25
  EXPOSE 7860
26
 
 
27
  CMD ["python", "app.py"]
 
# FastAPI + llama-cpp-python inference service (CPU-only).
# Base image `FROM python:3.10-slim` is declared above this hunk (diff context).

WORKDIR /app

# 1. System dependencies.
#    wget fetches the model at build time; build-essential is kept only as a
#    fallback in case pip has to compile llama-cpp-python from source.
#    --no-install-recommends keeps the layer small (hadolint DL3015);
#    the apt list cleanup happens in the same layer so it actually shrinks the image.
RUN apt-get update && apt-get install -y --no-install-recommends \
        build-essential \
        wget \
    && rm -rf /var/lib/apt/lists/*

# 2. Python dependencies.
#    The extra index serves pre-built CPU wheels of llama-cpp-python, avoiding
#    a long source build. The flag is placed before the package list rather
#    than between packages, where it read as if it were a package name.
#    NOTE(review): versions are unpinned — pin (e.g. fastapi==0.115.*) for
#    reproducible builds (hadolint DL3013).
RUN pip install --no-cache-dir \
        --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu \
        fastapi \
        uvicorn \
        llama-cpp-python

# 3. Download the GGUF model at build time so container startup is fast.
#    GGUF files embed tokenizer metadata, so no separate tokenizer download is needed.
#    NOTE(review): the `mosaicml` org does not appear to publish GGUF repos on
#    Hugging Face — this URL likely 404s (wget -q will fail silently into an
#    empty file only if -O is combined with a dead link; the build step itself
#    will error on a 404). The previously working URL in this repo's history was
#    https://huggingface.co/maddes8cht/mosaicml-mpt-7b-chat-gguf/resolve/main/mosaicml-mpt-7b-chat-Q2_K.gguf
#    Verify this link resolves before relying on the build.
RUN wget -q -O mpt-7b-chat.gguf \
    "https://huggingface.co/mosaicml/mpt-7b-chat-gguf/resolve/main/mpt-7b-chat.Q4_K_M.gguf"

# 4. Application code — copied last so code edits don't invalidate the
#    (multi-GB) model-download layer in the build cache.
COPY app.py .

# 5. Drop root: create the conventional Hugging Face Spaces user (uid 1000)
#    and hand it the app directory so the server can write runtime files.
RUN useradd -m -u 1000 user && chown -R user:user /app
USER user

# 6. Port 7860 is the Hugging Face Spaces default. EXPOSE is documentation
#    only — it does not publish the port.
EXPOSE 7860

# Exec-form CMD so the Python process is PID 1 and receives SIGTERM directly.
CMD ["python", "app.py"]