Commit
·
718a38c
1
Parent(s):
6d4a711
jax fixings
Browse files - Dockerfile +5 -2
Dockerfile
CHANGED
|
@@ -30,10 +30,10 @@ RUN set -eux; \
|
|
| 30 |
ENV LD_PRELOAD=/usr/local/cuda/lib64/libcusparse.so.12:/usr/local/cuda/lib64/libcublas.so.12:/usr/local/cuda/lib64/libcublasLt.so.12:/usr/local/cuda/lib64/libcufft.so.11:/usr/local/cuda/lib64/libcusolver.so.11
|
| 31 |
|
| 32 |
# Better allocator (less fragmentation than BFC during XLA autotune)
|
| 33 |
-
|
| 34 |
|
| 35 |
# Let cuBLAS use TF32 fast path on Ada (L40S) for big GEMMs
|
| 36 |
-
|
| 37 |
|
| 38 |
ENV DEBIAN_FRONTEND=noninteractive \
|
| 39 |
PYTHONUNBUFFERED=1 \
|
|
@@ -128,6 +128,9 @@ RUN python -m pip install --no-cache-dir --force-reinstall "protobuf==4.25.3"
|
|
| 128 |
|
| 129 |
RUN python -m pip install gradio
|
| 130 |
|
|
|
|
|
|
|
|
|
|
| 131 |
# Switch to Spaces’ preferred user
|
| 132 |
# Switch to Spaces’ preferred user
|
| 133 |
RUN useradd -m -u 1000 appuser
|
|
|
|
| 30 |
ENV LD_PRELOAD=/usr/local/cuda/lib64/libcusparse.so.12:/usr/local/cuda/lib64/libcublas.so.12:/usr/local/cuda/lib64/libcublasLt.so.12:/usr/local/cuda/lib64/libcufft.so.11:/usr/local/cuda/lib64/libcusolver.so.11
|
| 31 |
|
| 32 |
# Better allocator (less fragmentation than BFC during XLA autotune)
|
| 33 |
+
ENV TF_GPU_ALLOCATOR=cuda_malloc_async
|
| 34 |
|
| 35 |
# Let cuBLAS use TF32 fast path on Ada (L40S) for big GEMMs
|
| 36 |
+
ENV TF_ENABLE_CUBLAS_TF32=1 NVIDIA_TF32_OVERRIDE=1
|
| 37 |
|
| 38 |
ENV DEBIAN_FRONTEND=noninteractive \
|
| 39 |
PYTHONUNBUFFERED=1 \
|
|
|
|
| 128 |
|
| 129 |
RUN python -m pip install gradio
|
| 130 |
|
| 131 |
+
RUN python -m pip install --no-cache-dir --force-reinstall \
|
| 132 |
+
"jax==0.7.1" "jaxlib==0.7.1" "jax[cuda12]==0.7.1"
|
| 133 |
+
|
| 134 |
# Switch to Spaces’ preferred user
|
| 135 |
# Switch to Spaces’ preferred user
|
| 136 |
RUN useradd -m -u 1000 appuser
|