Spaces:

AIencoder
/

Axon

Running

File size: 882 Bytes

f187c31
125b07b
0b7b535
125b07b
d17c108
8cb66fd
 
d17c108
 
 
 
292dcba
eab1485
733fb2c
b399523
eab1485
5807e15
9bac561
d17c108
d3df5a7
d17c108
 
733fb2c
d17c108
733fb2c
 
eab1485
d17c108
733fb2c
9ac41e6
d17c108
2d07114
125b07b
d17c108
79672fe

FROM python:3.11-slim

WORKDIR /app

# Prevent Python from buffering stdout/stderr
ENV PYTHONUNBUFFERED=1

# Set HuggingFace cache to persistent storage
ENV HF_HOME=/data/.huggingface
ENV HF_HUB_CACHE=/data/.huggingface/hub

# Install system dependencies
RUN apt-get update && apt-get install -y \
    ffmpeg \
    libopenblas0 \
    && rm -rf /var/lib/apt/lists/*

# Install AVX512 + OpenBLAS optimized llama-cpp-python wheel (MAXIMUM SPEED!)
RUN pip install --no-cache-dir \
    https://huggingface.co/datasets/AIencoder/llama-cpp-wheels/resolve/main/llama_cpp_python-0.3.16%2Bopenblas_avx512_vnni-cp311-cp311-manylinux_2_31_x86_64.whl

# Install Python dependencies
RUN pip install --no-cache-dir \
    gradio>=5.0.0 \
    faster-whisper \
    huggingface_hub

# Copy application
COPY app.py /app/app.py

# Expose port
EXPOSE 7860

# Run the app directly
CMD ["python", "app.py"]