Spaces:
Sleeping
Sleeping
Fix build OOM: compile CUDA for A10G arch only, cap MAX_JOBS
Browse files
- Dockerfile +7 -4
Dockerfile
CHANGED
|
@@ -17,10 +17,13 @@ FROM nvidia/cuda:12.8.0-devel-ubuntu22.04
| 17 |   ENV DEBIAN_FRONTEND=noninteractive \
| 18 |   PYTHONUNBUFFERED=1 \
| 19 |   PIP_NO_CACHE_DIR=1 \
| 20 | - #
| 21 | - #
| 22 | - #
| 23 | - TORCH_CUDA_ARCH_LIST="
| 24 |
| 25 |   # Build tools + extension headers (libglm-dev) and the OpenCV runtime libs
| 26 |   # (libgl1, libglib2.0-0 — optgs's COLMAP loader imports cv2).
| 17 |   ENV DEBIAN_FRONTEND=noninteractive \
| 18 |   PYTHONUNBUFFERED=1 \
| 19 |   PIP_NO_CACHE_DIR=1 \
| 20 | + # Build CUDA kernels for the A10G (compute 8.6) only; +PTX keeps them
| 21 | + # forward-compatible with newer GPUs via driver JIT. Compiling all
| 22 | + # architectures at once OOM-kills the HF builder.
| 23 | + TORCH_CUDA_ARCH_LIST="8.6+PTX" \
| 24 | + # Cap parallel nvcc jobs — gsplat's kernels are memory-heavy and the HF
| 25 | + # Docker builder has limited RAM; an unbounded build gets OOM-killed.
| 26 | + MAX_JOBS=2
| 27 |
| 28 |   # Build tools + extension headers (libglm-dev) and the OpenCV runtime libs
| 29 |   # (libgl1, libglib2.0-0 — optgs's COLMAP loader imports cv2).