# Base image: the pytorch/pytorch image, selected by tag
# (2.6.0 / cuda12.6 / cudnn9 / devel).
# NOTE(review): the tag is not digest-pinned, so the image it resolves to may
# change over time — confirm whether a sha256 digest pin is wanted.
FROM pytorch/pytorch:2.6.0-cuda12.6-cudnn9-devel

# Working directory for the following instructions and for the container's
# default process.
WORKDIR /app

# System packages, installed and cleaned up in a single layer so the apt index
# never persists in the image.
#   --no-install-recommends keeps optional "recommended" packages out of the
#   image; ca-certificates is therefore listed explicitly so that HTTPS git
#   clones do not depend on it arriving as a recommendation of git.
#   DEBIAN_FRONTEND is set inline (not via ENV) so it does not leak into the
#   runtime environment.
# NOTE(review): ffmpeg/libsndfile1 are presumably required by the Python audio
# packages installed later in this file — confirm before removing either.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        ffmpeg \
        git \
        libsndfile1 \
    && rm -rf /var/lib/apt/lists/*

# Python dependencies, one per line and sorted so additions/removals diff
# cleanly.
# torchaudio is pinned to the release that pairs with the torch 2.6.0 named in
# the base image tag: an unpinned torchaudio can resolve to a newer release
# that requires a different torch, causing pip to replace the torch build
# shipped in the base image.
# NOTE(review): the remaining packages are still unpinned, so rebuilds are not
# reproducible — consider a constraints/requirements file with exact versions.
RUN pip install --no-cache-dir \
        cachetools \
        datasets \
        descript-audio-codec \
        einops \
        einx \
        huggingface_hub \
        hydra-core \
        librosa \
        lightning \
        loguru \
        loralib \
        natsort \
        omegaconf \
        opencc-python-reimplemented \
        ormsgpack \
        pydub \
        pyrootutils \
        resampy \
        rich \
        safetensors \
        silero-vad \
        soundfile \
        tiktoken \
        torchaudio==2.6.0 \
        transformers \
        zstandard

# Shallow-clone fish-speech into /app/fish-speech and install it in editable
# mode. --no-deps stops pip from resolving the project's own dependency list,
# so only the packages installed explicitly in this file are used.
#
# FISH_SPEECH_REF optionally selects a branch or tag to clone, e.g.
#   docker build --build-arg FISH_SPEECH_REF=<tag> .
# When left empty (the default) the repository's default branch tip is cloned,
# which means rebuilds may pick up different upstream code.
ARG FISH_SPEECH_REF=""
# The ${VAR:+...} expansion is performed by the shell: it emits
# `--branch <ref>` only when FISH_SPEECH_REF is non-empty.
# pip is pointed at the checkout by absolute path instead of `cd`-ing into it.
RUN git clone --depth 1 ${FISH_SPEECH_REF:+--branch "${FISH_SPEECH_REF}"} \
        https://github.com/fishaudio/fish-speech.git /app/fish-speech \
    && pip install --no-cache-dir --no-deps -e /app/fish-speech

# Application payload from the build context, copied after the dependency
# layers so edits to these files do not invalidate them.
# The entry script lands at /app/gen_samples.py (destination is a directory).
COPY gen_samples.py /app/
# The contents of the context's reference directory land under /app/reference/.
COPY reference /app/reference/

# Runtime environment for the container.
#   PYTHONPATH             - puts the fish-speech checkout first on the module
#                            search path. An inherited PYTHONPATH is appended
#                            only when it is non-empty, so no trailing ':'
#                            (an empty entry, i.e. the current directory) is
#                            left behind when the base image defines none.
#   TOKENIZERS_PARALLELISM - set to "false".
#   MPLCONFIGDIR, HF_HOME,
#   XDG_CACHE_HOME         - point config/cache directories at paths under /tmp.
# NOTE(review): the /tmp locations presumably exist so the container works
# under an arbitrary (non-root) UID — confirm; anything cached there is lost
# when the container is removed.
ENV PYTHONPATH=/app/fish-speech${PYTHONPATH:+:${PYTHONPATH}} \
    TOKENIZERS_PARALLELISM=false \
    MPLCONFIGDIR=/tmp/matplotlib \
    HF_HOME=/tmp/hf_cache \
    XDG_CACHE_HOME=/tmp/cache

# Default command: run the sample-generation script. Exec (JSON-array) form is
# used, so no shell wraps the Python process.
# NOTE(review): no USER instruction is visible in this file, so the process
# runs as whatever user the base image defaults to — confirm this is intended.
CMD ["python", "/app/gen_samples.py"]