Spaces:

AIencoder
/

Axon

Running

AIencoder committed on Jan 26

Commit

d17c108

verified ·

1 Parent(s): 1ecbdcf

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -2,27 +2,35 @@ FROM python:3.11-slim
 WORKDIR /app
-# Force unbuffered output so logs show immediately
 ENV PYTHONUNBUFFERED=1
 # Install system dependencies
 RUN apt-get update && apt-get install -y \
     ffmpeg \
     && rm -rf /var/lib/apt/lists/*
-# Install your wheel + dependencies
 RUN pip install --no-cache-dir \
-    https://github.com/Ary5272/llama-cpp-python/releases/download/v0.1.1/llama_cpp_python-0.3.16-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.whl \
-    gradio \
     faster-whisper \
     huggingface_hub
-# Create models directory
-RUN mkdir -p /models
-# Copy app
 COPY app.py /app/app.py
 EXPOSE 7860
 CMD ["python", "app.py"]

 WORKDIR /app
+# Disable Python's stdout/stderr buffering
 ENV PYTHONUNBUFFERED=1
+# Keep the HuggingFace home and hub cache under /data (persistent storage)
+ENV HF_HOME=/data/.huggingface \
+    HF_HUB_CACHE=/data/.huggingface/hub
 # Install system dependencies (ffmpeg) and remove the apt package lists in the
+# same layer so they do not persist in the image.
+# --no-install-recommends keeps optional "recommended" packages out of the image.
 RUN apt-get update && apt-get install -y --no-install-recommends \
     ffmpeg \
     && rm -rf /var/lib/apt/lists/*
+# Install the AVX2-optimized llama-cpp-python wheel (reported 2-3x faster).
+# If the wheel cannot be installed, fall back to the same release from PyPI so
+# both paths yield llama-cpp-python 0.3.16.
+# NOTE(review): the PyPI fallback presumably builds from source and would need a
+# C/C++ toolchain that this image does not install - confirm it can succeed.
+RUN pip install --no-cache-dir \
+    https://huggingface.co/datasets/AIencoder/llama-cpp-wheels/resolve/main/llama_cpp_python-0.3.16-cp311-cp311-manylinux_2_31_x86_64.whl \
+    || pip install --no-cache-dir llama-cpp-python==0.3.16
+# Install Python dependencies.
+# The gradio specifier is quoted because shell-form RUN executes via /bin/sh,
+# where an unquoted ">=5.0.0" is parsed as an output redirection to a file named
+# "=5.0.0" and the version constraint is silently dropped.
 RUN pip install --no-cache-dir \
+    "gradio>=5.0.0" \
     faster-whisper \
     huggingface_hub
+# Place the application script in /app
 COPY app.py /app/
+# Document the port the container listens on
 EXPOSE 7860
+# Launch app.py with the Python interpreter (exec form, no shell wrapper)
 CMD [ "python", "app.py" ]