# andrew-speech-agent / Dockerfile
# andrewchernish1-ui
# fix: use faster-whisper model and add accelerate
# 70c01d1
# Base image: slim variant of the official Python 3.10 image.
FROM python:3.10-slim

# Do not write .pyc files, and keep stdout/stderr unbuffered so log output
# shows up immediately.
ENV PYTHONDONTWRITEBYTECODE=1
ENV PYTHONUNBUFFERED=1

# Relative paths in the instructions that follow resolve against /app.
WORKDIR /app
# System packages: the ffmpeg CLI, a C toolchain, git, pkg-config and the
# FFmpeg development headers.
# NOTE(review): the -dev headers and build-essential are presumably needed to
# compile a Python dependency from source — confirm against requirements.txt.
# The apt package lists are removed in the same layer so they never reach the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        ffmpeg \
        git \
        libavcodec-dev \
        libavdevice-dev \
        libavfilter-dev \
        libavformat-dev \
        libavutil-dev \
        libswresample-dev \
        libswscale-dev \
        pkg-config \
    && rm -rf /var/lib/apt/lists/*
# Copy only the dependency manifest first so this layer is rebuilt only when
# requirements.txt changes, not on every source edit.
COPY requirements.txt .

# --no-cache-dir keeps pip's download/wheel cache out of the image layer,
# which would otherwise be stored in the image for no runtime benefit.
RUN pip install --no-cache-dir --upgrade pip \
    && pip install --no-cache-dir -r requirements.txt
# Hugging Face repositories to bake into the image at build time.
# Override with --build-arg; pass an empty value to skip a download.
ARG WHISPER_MODEL=Systran/faster-whisper-small
ARG LLM_MODEL=Qwen/Qwen2.5-0.5B-Instruct

# Turn off the optional hf_transfer download backend.
ENV HF_HUB_ENABLE_HF_TRANSFER=0

# Build args are visible to RUN as environment variables, so the script reads
# them from os.environ. Each configured repo is downloaded into a fixed
# directory under /models.
RUN python - <<'PY'
import os

from huggingface_hub import snapshot_download

# (build-arg name, destination directory), processed in this order.
targets = (
    ("WHISPER_MODEL", "/models/whisper"),
    ("LLM_MODEL", "/models/llm"),
)

for var_name, dest in targets:
    repo = os.environ.get(var_name)
    # An unset or empty build arg means "do not download this model".
    if repo:
        snapshot_download(repo_id=repo, local_dir=dest, local_dir_use_symlinks=False)
PY
# Application source goes in last so code changes do not invalidate the
# dependency and model layers above.
COPY . ./

# Documents the port the server listens on; it does not publish the port.
EXPOSE 7860/tcp

# NOTE(review): no USER is set in this file, so the server presumably runs as
# root — consider a dedicated non-root user if the app's write paths allow it.
# Exec form: uvicorn serves app.main:app on all interfaces.
CMD ["uvicorn", "app.main:app", "--host", "0.0.0.0", "--port", "7860"]