Spaces:

viskav
/

format

Sleeping

viskav committed on Dec 13, 2025

Commit

0a29f38

verified ·

1 Parent(s): 67a0f44

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -2,23 +2,30 @@ FROM python:3.10-slim
 WORKDIR /code
-# Install build dependencies for llama-cpp-python
 RUN apt-get update && apt-get install -y \
     build-essential \
-    git \
     cmake \
     && rm -rf /var/lib/apt/lists/*
 # Copy requirements first
 COPY requirements.txt .
-# Install with specific BLAS backend for better performance
-RUN CMAKE_ARGS="-DLLAMA_BLAS=ON -DLLAMA_BLAS_VENDOR=OpenBLAS" \
-    pip install --no-cache-dir -r requirements.txt
 # Copy app
 COPY app.py .
 EXPOSE 7860
-CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]

 WORKDIR /code
+# Install ONLY essential build dependencies
 RUN apt-get update && apt-get install -y \
     build-essential \
     cmake \
+    libopenblas-dev \
     && rm -rf /var/lib/apt/lists/*
 # Copy requirements first
 COPY requirements.txt .
+# Install with OpenBLAS optimization (CRITICAL FOR SPEED)
+ENV CMAKE_ARGS="-DLLAMA_BLAS=ON -DLLAMA_BLAS_VENDOR=OpenBLAS"
+RUN pip install --no-cache-dir -r requirements.txt
 # Copy app
 COPY app.py .
+# Environment optimizations
+ENV PYTHONUNBUFFERED=1
+ENV N_THREADS=8
+ENV N_CTX=512
+ENV N_BATCH=256
 EXPOSE 7860
+# Use uvicorn directly with optimized workers
+CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1"]