CooLLaMACEO committed on
Commit
494bc63
·
verified ·
1 Parent(s): 3718e07

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -7
Dockerfile CHANGED
@@ -3,18 +3,18 @@ FROM python:3.11-slim
3
 
4
  WORKDIR /app
5
 
6
- # We still need wget for the model, but we can skip the heavy compilers!
7
  RUN apt-get update && apt-get install -y wget && rm -rf /var/lib/apt/lists/*
8
 
9
- # 1. Install pre-built llama-cpp-python (CPU version)
10
- # This bypasses the "Building wheel..." stage entirely
11
- RUN pip install llama-cpp-python \
12
- --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu
13
 
14
- # 2. Install your other web tools
15
  RUN pip install --no-cache-dir fastapi uvicorn[standard] requests
16
 
17
- # 3. Setup models
18
  RUN mkdir -p ./models
19
  RUN wget -q -O ./models/gpt-oss-20b-Q3_K_M.gguf \
20
  https://huggingface.co/unsloth/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-Q3_K_M.gguf
 
3
 
4
  WORKDIR /app
5
 
6
+ # Install wget (needed for the model)
7
  RUN apt-get update && apt-get install -y wget && rm -rf /var/lib/apt/lists/*
8
 
9
+ # 1. Install PREBUILT llama-cpp-python directly via URL
10
+ # This specific wheel is for Linux x86_64 and Python 3.11
11
+ RUN pip install --no-cache-dir \
12
+ https://github.com/abetlen/llama-cpp-python/releases/download/v0.3.16/llama_cpp_python-0.3.16-cp311-cp311-manylinux_2_17_x86_64.whl
13
 
14
+ # 2. Install web dependencies
15
  RUN pip install --no-cache-dir fastapi uvicorn[standard] requests
16
 
17
+ # 3. Setup models directory and download GPT-OSS-20B
18
  RUN mkdir -p ./models
19
  RUN wget -q -O ./models/gpt-oss-20b-Q3_K_M.gguf \
20
  https://huggingface.co/unsloth/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-Q3_K_M.gguf