# syntax=docker/dockerfile:1

# The syntax directive above must remain the very first line of the file. It
# pins the BuildKit Dockerfile frontend, which the heredoc-style RUN used later
# in this file requires (heredocs need frontend >= 1.4).

# Slim Debian-based Python image: smaller footprint than the full variant.
# NOTE(review): Python 3.9 is past upstream end-of-life; consider bumping the
# tag once requirements.txt has been verified against a newer interpreter.
FROM python:3.9-slim

# Working directory for every following instruction and for the running app.
WORKDIR /code

# Install system deps for ffmpeg + audio libs.
# This runs before requirements.txt is copied so that editing the Python
# requirements does not invalidate (and re-run) the apt layer.
# --no-install-recommends keeps optional packages out of the image, and the apt
# lists are deleted in the same layer so they never contribute to image size.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ffmpeg \
        libsndfile1 \
    && rm -rf /var/lib/apt/lists/*

# Copy only the dependency manifest (make sure it includes soundfile) so the
# pip layer below is rebuilt only when the requirements actually change.
COPY ./requirements.txt /code/requirements.txt

# Install Python deps; --no-cache-dir avoids storing pip's download cache in
# the layer.
RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt

# Use HF_HOME to control the Hugging Face / transformers cache location.
# It is an ENV (not ARG) because the running app must resolve the same path.
ENV HF_HOME=/code/hf_cache

# Pre-download the ASR model at build time so the runtime does not have to
# download it.
#
# Permissions are opened up AFTER the download, inside the same RUN:
#   * doing it before the download (as a separate step) leaves every file and
#     directory created by the download with root-only write access;
#   * doing it in a later RUN would copy the whole model into a second layer.
# a+rwX grants read/write to everyone and execute only on directories (and
# files that were already executable), instead of marking model blobs
# executable as 777 would.
# NOTE(review): if the runtime UID is known, prefer chown to that user over a
# world-writable cache.
RUN <<'EOF'
set -eu
mkdir -p "$HF_HOME"
python - <<'PY'
from transformers import pipeline
pipeline('automatic-speech-recognition', model='distil-whisper/distil-large-v3')
PY
chmod -R a+rwX "$HF_HOME"
EOF

# Run the service as an unprivileged user rather than root.
# NOTE(review): UID 1000 is chosen on the assumption (from port 7860) that this
# image targets Hugging Face Spaces, which runs containers as UID 1000 --
# adjust if your platform mandates a different UID.
# Only the /code directory entry itself is chown'ed (non-recursive) so the app
# can create files in its working directory without rewriting earlier layers.
RUN useradd --create-home --user-group --uid 1000 appuser \
    && chown appuser:appuser /code

# Application code is copied last so that editing app.py does not invalidate
# the dependency and model layers built earlier.
COPY --chown=appuser:appuser ./app.py /code/app.py

USER appuser

# Documentation only: the port uvicorn binds to below.
EXPOSE 7860
# Exec form so uvicorn runs as PID 1 and receives stop signals directly.
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]