Spaces:

thecollabagepatch
/

magenta-retry

Running

App Files Files Community

magenta-retry / Dockerfile

thecollabagepatch

i think we did it? gradio with fastrtc v1

c8f33f0 4 months ago

raw

history blame contribute delete

6.68 kB

	# Dockerfile for HuggingFace Space deployment (x86_64)
	# Based on working Modal Dockerfile.x86
	FROM nvidia/cuda:12.6.2-cudnn-runtime-ubuntu22.04

	# Ensure CUDA libraries are on loader path
	RUN apt-get update && apt-get install -y --no-install-recommends \
	cuda-libraries-12-4 && rm -rf /var/lib/apt/lists/*
	ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64:/usr/local/cuda-12.4/lib64:/usr/local/cuda-12.4/compat:/usr/local/cuda/targets/x86_64-linux/lib:${LD_LIBRARY_PATH}
	RUN ln -sf /usr/local/cuda/targets/x86_64-linux/lib /usr/local/cuda/lib64 \|\| true

	# Install cuDNN 9.8 for better compatibility
	RUN set -eux; \
	apt-get update && apt-get install -y --no-install-recommends gnupg ca-certificates curl; \
	install -d -m 0755 /usr/share/keyrings; \
	curl -fsSL https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/3bf863cc.pub \
	\| gpg --batch --yes --dearmor -o /usr/share/keyrings/cuda-archive-keyring.gpg; \
	apt-get update; \
	apt-mark unhold libcudnn9-cuda-12 \|\| true; \
	apt-get install -y --no-install-recommends \
	'libcudnn9-cuda-12=9.8.*' \
	'libcudnn9-dev-cuda-12=9.8.*' \
	--allow-downgrades --allow-change-held-packages; \
	apt-mark hold libcudnn9-cuda-12 \|\| true; \
	ldconfig; \
	rm -rf /var/lib/apt/lists/*

	# Performance optimizations for L40S/Ada
	ENV LD_PRELOAD=/usr/local/cuda/lib64/libcusparse.so.12:/usr/local/cuda/lib64/libcublas.so.12:/usr/local/cuda/lib64/libcublasLt.so.12:/usr/local/cuda/lib64/libcufft.so.11:/usr/local/cuda/lib64/libcusolver.so.11
	ENV TF_GPU_ALLOCATOR=cuda_malloc_async
	ENV TF_ENABLE_CUBLAS_TF32=1 NVIDIA_TF32_OVERRIDE=1

	ENV DEBIAN_FRONTEND=noninteractive \
	PYTHONUNBUFFERED=1 \
	PIP_NO_CACHE_DIR=1 \
	TF_FORCE_GPU_ALLOW_GROWTH=true \
	XLA_PYTHON_CLIENT_PREALLOCATE=false \
	JAX_PLATFORMS="cuda"

	SHELL ["/bin/bash", "-c"]

	# Install system dependencies
	RUN apt-get update && apt-get install -y --no-install-recommends \
	software-properties-common curl ca-certificates \
	build-essential pkg-config git \
	libsndfile1 ffmpeg \
	&& add-apt-repository ppa:deadsnakes/ppa -y \
	&& apt-get update && apt-get install -y --no-install-recommends \
	python3.11 python3.11-dev python3.11-venv python3-pip \
	&& rm -rf /var/lib/apt/lists/*

	# Make python3.11 default and install uv for faster package installs
	RUN ln -sf /usr/bin/python3.11 /usr/bin/python && \
	ln -sf /usr/bin/python3.11 /usr/bin/python3 && \
	python -m pip install --upgrade pip && \
	python -m pip install uv

	# CRITICAL: Install TensorFlow FIRST to block tensorflow-cpu
	RUN uv pip install --system tf-nightly

	# Install JAX with CUDA support (pinned for stability)
	RUN uv pip install --system "jax[cuda12]==0.7.1" jaxlib

	# -------------------------------------------------------------------
	# HARD STABILIZER: prevent resampy->numba from selecting py<3.10-only wheels
	# Also keep numpy < 2 to avoid later numba incompat headaches on py311.
	# -------------------------------------------------------------------
	RUN printf "numpy<2\nnumba>=0.57.0\nllvmlite>=0.40.0\n" > /tmp/constraints.txt && \
	echo "---- constraints.txt ----" && \
	cat /tmp/constraints.txt && \
	echo "------------------------"

	# (Optional but often helpful) install pinned trio first so they land as wheels cleanly,
	# then everything else resolves around them.
	RUN uv pip install --system -c /tmp/constraints.txt "numpy<2" "numba>=0.57.0" "llvmlite>=0.40.0"

	# Install base dependencies (constraints applied)
	RUN uv pip install --system -c /tmp/constraints.txt \
	absl-py chex gin-config numpy requests tqdm typing-extensions \
	google-cloud-storage librosa resampy soundfile sentencepiece

	# Clone and install t5x WITHOUT dependencies (avoid tensorflow-cpu)
	RUN git clone https://github.com/google-research/t5x.git /t5x && \
	cd /t5x && \
	git checkout 92c5b467a5964d06c351c7eae4aa4bcd341c7ded && \
	uv pip install --system --no-deps -e .

	# Install flaxformer without deps
	RUN git clone https://github.com/google/flaxformer.git /flaxformer && \
	cd /flaxformer && \
	git checkout 399ea3a && \
	uv pip install --system --no-deps -e .

	# Install seqio without deps and PATCH OUT tensorflow_text
	RUN git clone https://github.com/google/seqio.git /seqio && \
	cd /seqio && \
	uv pip install --system --no-deps -e . && \
	sed -i '/import tensorflow_text as tf_text/d' /seqio/seqio/vocabularies.py

	# Install airio (t5x dependency) without deps
	RUN git clone https://github.com/google/airio.git /airio && \
	cd /airio && \
	uv pip install --system --no-deps -e .

	# Install clu without deps
	RUN git clone https://github.com/google/CommonLoopUtils.git /clu && \
	cd /clu && \
	uv pip install --system --no-deps -e .

	# Now install all remaining dependencies these packages need (constraints applied)
	RUN uv pip install --system -c /tmp/constraints.txt \
	flax optax orbax-checkpoint \
	fiddle cached_property tf2jax \
	aqtp etils jestimator \
	tensorflow-datasets tfds-nightly \
	apache-beam pyyaml rouge-score sacrebleu scipy \
	grain-nightly editdistance pyglove

	# Patch jestimator for newer JAX - PartitionSpec moved to jax.sharding
	RUN sed -i 's\|from jax.experimental.pjit import PartitionSpec\|from jax.sharding import PartitionSpec\|g' \
	/usr/local/lib/python3.11/dist-packages/jestimator/amos_helper.py \|\| \
	sed -i 's\|from jax.experimental.pjit import PartitionSpec\|from jax.sharding import PartitionSpec\|g' \
	/usr/lib/python3.11/dist-packages/jestimator/amos_helper.py \|\| true

	# Install magenta-realtime without deps
	RUN git clone https://github.com/magenta/magenta-realtime.git /magenta-realtime-src && \
	cd /magenta-realtime-src && \
	uv pip install --system --no-deps -e .

	# API and audio processing dependencies (constraints applied)
	RUN uv pip install --system -c /tmp/constraints.txt \
	fastapi uvicorn[standard] python-multipart \
	pyloudnorm gradio soxr huggingface_hub

	# Ensure compatible protobuf version
	RUN uv pip install --system --force-reinstall "protobuf>=5.27.0"

	RUN uv pip install --system fastrtc

	# Set working directory and create cache
	WORKDIR /app
	ENV MAGENTA_RT_CACHE_DIR=/root/.cache/magenta_rt
	RUN mkdir -p $MAGENTA_RT_CACHE_DIR

	# Copy application files for HuggingFace Space
	COPY app.py /app/
	COPY utils.py /app/
	COPY jam_worker.py /app/
	COPY one_shot_generation.py /app/
	COPY model_management.py /app/
	COPY documentation.html /app/
	COPY lil_demo_540p.mp4 /app/
	COPY magentaRT_rt_tester.html /app/
	COPY magenta_prompts.js /app/
	COPY docs/ /app/docs/
	COPY fastrtc_magenta.py /app/

	EXPOSE 7860
	CMD ["python", "-m", "uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]