Spaces:

viskav
/

format

Sleeping

viskav committed on Dec 12, 2025

Commit

4acd6aa

verified ·

1 Parent(s): 73f597e

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -1,21 +1,48 @@
 FROM python:3.11-slim
-# Install system dependencies needed for llama-cpp-python
 RUN apt-get update && apt-get install -y --no-install-recommends \
     build-essential \
     cmake \
     && rm -rf /var/lib/apt/lists/*
-# Workdir
-WORKDIR /app
-# Install Python deps
-COPY requirements.txt .
-RUN pip install --no-cache-dir -r requirements.txt
-# Copy app
-COPY app.py .
 EXPOSE 7860
 CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]

+# ---------------------------------------------------------
+# Dockerfile for HuggingFace Spaces (Custom Docker Runtime)
+# Runs FastAPI + llama-cpp-python + GGUF model
+# ---------------------------------------------------------
 FROM python:3.11-slim
+# Install system dependencies required by llama-cpp-python
 RUN apt-get update && apt-get install -y --no-install-recommends \
     build-essential \
     cmake \
+    git \
+    wget \
+    libgomp1 \
+    libopenblas-dev \
     && rm -rf /var/lib/apt/lists/*
+# Set the working directory
+WORKDIR /code
+# Copy requirements first (for better Docker cache)
+COPY requirements.txt /code/requirements.txt
+# Install Python dependencies
+RUN pip install --no-cache-dir --upgrade pip \
+    && pip install --no-cache-dir -r /code/requirements.txt
+# Copy application file
+COPY app.py /code/app.py
+# Copy your model folder (GGUF file)
+COPY model /code/model
+# Environment variables for llama.cpp backend
+ENV MODEL_PATH=/code/model/Phi-3.1-mini-4k-instruct-IQ2_M.gguf
+ENV N_THREADS=4
+ENV N_CTX=4096
+ENV N_BATCH=512
+ENV N_GPU_LAYERS=0
+ENV MAX_CONCURRENT_REQUESTS=6
+ENV PYTHONUNBUFFERED=1
+# HuggingFace Spaces requires server to run on port 7860
 EXPOSE 7860
+# Start FastAPI with uvicorn
 CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]