FROM ubuntu:24.04 WORKDIR /space RUN printf 'Acquire::Retries "5";\nAcquire::http::Timeout "30";\nAcquire::https::Timeout "30";\n' \ > /etc/apt/apt.conf.d/80-retries && \ apt-get update && \ apt-get install -y --fix-missing bash curl ffmpeg python3 python3-pip \ libomp5 libgomp1 && \ rm -rf /var/lib/apt/lists/* /var/cache/apt/archives/* # Pre-built binaries from GitHub Releases — avoids the 6+ minute C++ # compilation that exceeds the HF free-tier Docker build timeout. # v3: tarball with SOVERSION symlinks now includes lib symlinks (libcrispasr.so → libcrispasr.so.0.7.1 etc.) ARG BIN_URL=https://github.com/CrispStrobe/CrispASR/releases/download/hf-space-bin/crispasr-bin-linux-x64.tar.gz RUN mkdir -p /opt/crispasr/build/bin && \ curl -fSL "${BIN_URL}" -o /tmp/crispasr-bin.tar.gz && \ tar xzf /tmp/crispasr-bin.tar.gz -C /opt/crispasr/build/bin/ && \ rm /tmp/crispasr-bin.tar.gz && \ find /opt/crispasr/build/bin -name 'lib*.so*' -exec cp -a {} /usr/local/lib/ \; && \ ldconfig # Pre-download G2P dicts + kokoro model so TTS works on first call. RUN mkdir -p /cache/.cache/crispasr && \ curl -sL "https://huggingface.co/datasets/cstr/g2p-dicts/resolve/main/espeak_en.tsv" \ -o /cache/.cache/crispasr/espeak_en.tsv && \ curl -sL "https://raw.githubusercontent.com/cmusphinx/cmudict/refs/heads/master/cmudict.dict" \ -o /cache/.cache/crispasr/cmudict.dict && \ curl -sL "https://huggingface.co/cstr/kokoro-82m-GGUF/resolve/main/kokoro-82m-q8_0.gguf" \ -o /cache/kokoro-82m-q8_0.gguf && \ curl -sL "https://huggingface.co/cstr/kokoro-voices-GGUF/resolve/main/kokoro-voice-af_heart.gguf" \ -o /cache/kokoro-voice-af_heart.gguf && \ ls -lh /cache/ /cache/.cache/crispasr/ || true # Fetch bundled sample audio from the GitHub repo (optional). ARG CRISPASR_REPO=https://github.com/CrispStrobe/CrispASR RUN mkdir -p /space/samples && \ curl -sL "${CRISPASR_REPO}/raw/main/samples/jfk.wav" -o /space/samples/jfk.wav 2>/dev/null || true COPY requirements.txt /space/requirements.txt RUN pip3 install --no-cache-dir --break-system-packages -r /space/requirements.txt COPY app.py start.sh /space/ RUN chmod +x /space/start.sh && \ id -u 1000 >/dev/null 2>&1 || useradd -m -u 1000 app && \ mkdir -p /models /cache && \ chown -R 1000:1000 /space /opt/crispasr /models /cache ENV PATH=/opt/crispasr/build/bin:$PATH ENV HOME=/cache ENV CRISPASR_SERVER_URL=http://127.0.0.1:8080 ENV CRISPASR_CACHE_DIR=/cache ENV CRISPASR_SAMPLES_DIR=/space/samples ENV GRADIO_SERVER_NAME=0.0.0.0 ENV GRADIO_SERVER_PORT=7860 USER 1000 EXPOSE 7860 EXPOSE 8080 ENTRYPOINT ["/space/start.sh"]