CooLLaMACEO committed on
Commit
9a444d0
·
verified ·
1 Parent(s): 494bc63

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -7
Dockerfile CHANGED
@@ -1,20 +1,20 @@
1
- # Base image
2
- FROM python:3.11-slim
3
 
4
  WORKDIR /app
5
 
6
- # Install wget (needed for the model)
7
  RUN apt-get update && apt-get install -y wget && rm -rf /var/lib/apt/lists/*
8
 
9
- # 1. Install PREBUILT llama-cpp-python directly via URL
10
- # This specific wheel is for Linux x86_64 and Python 3.11
11
  RUN pip install --no-cache-dir \
12
- https://github.com/abetlen/llama-cpp-python/releases/download/v0.3.16/llama_cpp_python-0.3.16-cp311-cp311-manylinux_2_17_x86_64.whl
13
 
14
  # 2. Install web dependencies
15
  RUN pip install --no-cache-dir fastapi uvicorn[standard] requests
16
 
17
- # 3. Setup models directory and download GPT-OSS-20B
18
  RUN mkdir -p ./models
19
  RUN wget -q -O ./models/gpt-oss-20b-Q3_K_M.gguf \
20
  https://huggingface.co/unsloth/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-Q3_K_M.gguf
 
# syntax=docker/dockerfile:1
# Python 3.10 matches the cp310 ABI tag of the prebuilt llama-cpp-python
# wheel installed below.
FROM python:3.10-slim

WORKDIR /app

# wget is needed to fetch the model weights. --no-install-recommends keeps
# the layer small; the apt list cleanup stays in the same layer so the
# cache never persists in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends wget \
    && rm -rf /var/lib/apt/lists/*

# 1. Install PREBUILT llama-cpp-python (community wheel built for the HF
#    Spaces free CPU tier, 16GB RAM). Installing from a wheel URL avoids
#    compiling llama.cpp from source inside the image.
RUN pip install --no-cache-dir \
    https://huggingface.co/Luigi/llama-cpp-python-wheels-hf-spaces-free-cpu/resolve/main/llama_cpp_python-0.3.22-cp310-cp310-linux_x86_64.whl

# 2. Install web dependencies. "uvicorn[standard]" is quoted so the shell
#    does not treat the brackets as a glob pattern.
#    NOTE(review): these are unpinned (hadolint DL3013); pin exact versions
#    for reproducible builds once known-good versions are confirmed.
RUN pip install --no-cache-dir fastapi "uvicorn[standard]" requests

# 3. Download the GPT-OSS-20B GGUF weights at build time. mkdir and wget
#    form one logical step (wget -O does not create parent directories),
#    so they share a single layer.
RUN mkdir -p ./models \
    && wget -q -O ./models/gpt-oss-20b-Q3_K_M.gguf \
       https://huggingface.co/unsloth/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-Q3_K_M.gguf

# NOTE(review): no USER or CMD/ENTRYPOINT appears in this file — the image
# runs as root and relies on an externally supplied start command. Confirm
# whether a non-root user and an exec-form CMD should be added here.