|
|
# Global build arguments. They are declared before the first FROM so that FROM
# lines can reference them (BASE_IMAGE and INTEL_BASE_IMAGE are used that way).
ARG BASE_IMAGE=ubuntu:24.04

# Both of these default to BASE_IMAGE unless overridden with --build-arg.
ARG GRPC_BASE_IMAGE=${BASE_IMAGE}
ARG INTEL_BASE_IMAGE=${BASE_IMAGE}

# Ubuntu release codename; "noble" corresponds to the default 24.04 base image.
ARG UBUNTU_CODENAME=noble
|
|
|
|
|
# Stage "requirements": base packages shared by every stage derived from it.
FROM ${BASE_IMAGE} AS requirements

# Stop apt/dpkg from prompting during package installation.
ENV DEBIAN_FRONTEND=noninteractive

# update + install + cleanup happen in one layer so the apt cache and package
# lists never persist in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
        espeak-ng \
        ffmpeg \
        libgomp1 \
        libopenblas-dev \
        libopenblas0 \
        wget \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*
|
|
|
|
|
|
|
|
# Stage "requirements-drivers": adds the accelerator-specific packages selected
# by BUILD_TYPE on top of the shared requirements.
FROM requirements AS requirements-drivers

# Accelerator selection; SKIP_DRIVERS=true disables the driver installs below.
ARG BUILD_TYPE
ARG SKIP_DRIVERS=false

# Versions interpolated into package names and download URLs further down.
ARG CUDA_MAJOR_VERSION=12
ARG CUDA_MINOR_VERSION=0
ARG UBUNTU_VERSION=2404

# Platform arguments for the image being built.
ARG TARGETARCH
ARG TARGETVARIANT

# Persist the build type into the image environment.
ENV BUILD_TYPE=${BUILD_TYPE}

# Record "default" as the capability; later steps overwrite this file when a
# specific accelerator is configured.
RUN mkdir -p /run/localai \
    && echo "default" > /run/localai/capability
|
|
|
|
|
|
|
|
# Vulkan: install the build dependencies and Vulkan SDK 1.4.335.0, then record
# "vulkan" as the image capability. Only runs when BUILD_TYPE=vulkan and
# SKIP_DRIVERS=false.
#
# The script runs under "set -e" with one command per line. Previously the
# commands were only partially chained with "&&", so a failed package install
# or SDK download was ignored and the capability file was still written.
#
# NOTE: the heredoc delimiter is unquoted, so variable references are expanded
# before bash reads the script; do not introduce script-local variables here.
RUN <<EOT bash
    set -e
    if [ "${BUILD_TYPE}" = "vulkan" ] && [ "${SKIP_DRIVERS}" = "false" ]; then
        apt-get update
        apt-get install -y --no-install-recommends \
            software-properties-common pciutils wget gpg-agent
        apt-get install -y libglm-dev cmake libxcb-dri3-0 libxcb-present0 libpciaccess0 \
            libpng-dev libxcb-keysyms1-dev libxcb-dri3-dev libx11-dev g++ gcc \
            libwayland-dev libxrandr-dev libxcb-randr0-dev libxcb-ewmh-dev \
            git python-is-python3 bison libx11-xcb-dev liblz4-dev libzstd-dev \
            ocaml-core ninja-build pkg-config libxml2-dev wayland-protocols python3-jsonschema \
            clang-format qtbase5-dev qt6-base-dev libxcb-glx0-dev sudo xz-utils mesa-vulkan-drivers

        if [ "amd64" = "$TARGETARCH" ]; then
            # LunarG SDK: build the selected components, then copy them into
            # the system directories.
            wget "https://sdk.lunarg.com/sdk/download/1.4.335.0/linux/vulkansdk-linux-x86_64-1.4.335.0.tar.xz"
            tar -xf vulkansdk-linux-x86_64-1.4.335.0.tar.xz
            rm vulkansdk-linux-x86_64-1.4.335.0.tar.xz
            mkdir -p /opt/vulkan-sdk
            mv 1.4.335.0 /opt/vulkan-sdk/
            cd /opt/vulkan-sdk/1.4.335.0
            ./vulkansdk --no-deps --maxjobs \
                vulkan-loader \
                vulkan-validationlayers \
                vulkan-extensionlayer \
                vulkan-tools \
                shaderc
            cp -rfv /opt/vulkan-sdk/1.4.335.0/x86_64/bin/* /usr/bin/
            cp -rfv /opt/vulkan-sdk/1.4.335.0/x86_64/lib/* /usr/lib/x86_64-linux-gnu/
            cp -rfv /opt/vulkan-sdk/1.4.335.0/x86_64/include/* /usr/include/
            cp -rfv /opt/vulkan-sdk/1.4.335.0/x86_64/share/* /usr/share/
            # Leave the SDK tree before deleting it so the remaining commands
            # do not run from a removed working directory.
            cd /
            rm -rf /opt/vulkan-sdk
        fi

        if [ "arm64" = "$TARGETARCH" ]; then
            # SDK archive for arm64; its contents are copied into the system
            # directories and the scratch directory is removed afterwards.
            mkdir vulkan
            cd vulkan
            curl -L -o vulkan-sdk.tar.xz https://github.com/mudler/vulkan-sdk-arm/releases/download/1.4.335.0/vulkansdk-ubuntu-24.04-arm-1.4.335.0.tar.xz
            tar -xvf vulkan-sdk.tar.xz
            rm vulkan-sdk.tar.xz
            cd 1.4.335.0
            cp -rfv aarch64/bin/* /usr/bin/
            cp -rfv aarch64/lib/* /usr/lib/aarch64-linux-gnu/
            cp -rfv aarch64/include/* /usr/include/
            cp -rfv aarch64/share/* /usr/share/
            cd ../..
            rm -rf vulkan
        fi

        ldconfig
        apt-get clean
        rm -rf /var/lib/apt/lists/*
        echo "vulkan" > /run/localai/capability
    fi
EOT
|
|
|
|
|
|
|
|
# CUDA: register the NVIDIA apt repository through the cuda-keyring package,
# install the CUDA compiler and math-library dev packages for the requested
# version, and record "nvidia-cuda-<major>" as the image capability. Only runs
# when BUILD_TYPE is cublas or l4t and SKIP_DRIVERS=false.
#
# The script runs under "set -e" with one command per line, and curl uses -f.
# Previously a failed download or install was ignored (the commands were not
# all chained) and the capability file was still written, and an HTTP error
# page could be saved as the .deb file.
#
# NOTE: the heredoc delimiter is unquoted, so variable references are expanded
# before bash reads the script; do not introduce script-local variables here.
RUN <<EOT bash
    set -e
    if ( [ "${BUILD_TYPE}" = "cublas" ] || [ "${BUILD_TYPE}" = "l4t" ] ) && [ "${SKIP_DRIVERS}" = "false" ]; then
        apt-get update
        apt-get install -y --no-install-recommends \
            software-properties-common pciutils

        # The keyring package lives under an architecture-specific repo path.
        if [ "amd64" = "$TARGETARCH" ]; then
            curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu${UBUNTU_VERSION}/x86_64/cuda-keyring_1.1-1_all.deb
        fi
        if [ "arm64" = "$TARGETARCH" ]; then
            # CUDA 13 is fetched from the sbsa path; other versions use arm64.
            if [ "${CUDA_MAJOR_VERSION}" = "13" ]; then
                curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu${UBUNTU_VERSION}/sbsa/cuda-keyring_1.1-1_all.deb
            else
                curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu${UBUNTU_VERSION}/arm64/cuda-keyring_1.1-1_all.deb
            fi
        fi

        # Fails (and aborts the build) when no keyring was downloaded, e.g. on
        # an architecture not handled above.
        dpkg -i cuda-keyring_1.1-1_all.deb
        rm -f cuda-keyring_1.1-1_all.deb

        apt-get update
        apt-get install -y --no-install-recommends \
            cuda-nvcc-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcufft-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcurand-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcublas-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcusparse-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
            libcusolver-dev-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION}

        # Extra packages installed only for CUDA 13 on arm64.
        if [ "${CUDA_MAJOR_VERSION}" = "13" ] && [ "arm64" = "$TARGETARCH" ]; then
            apt-get install -y --no-install-recommends \
                libcufile-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
                libcudnn9-cuda-${CUDA_MAJOR_VERSION} \
                cuda-cupti-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION} \
                libnvjitlink-${CUDA_MAJOR_VERSION}-${CUDA_MINOR_VERSION}
        fi

        apt-get clean
        rm -rf /var/lib/apt/lists/*
        echo "nvidia-cuda-${CUDA_MAJOR_VERSION}" > /run/localai/capability
    fi
EOT
|
|
|
|
|
# cublas builds targeting arm64 record the L4T-flavoured CUDA capability,
# replacing whatever an earlier step wrote to the capability file.
RUN if [ "${BUILD_TYPE}" = "cublas" ] && [ "${TARGETARCH}" = "arm64" ]; then \
        echo "nvidia-l4t-cuda-${CUDA_MAJOR_VERSION}" > /run/localai/capability; \
    fi
|
|
|
|
|
|
|
|
# cublas on arm64: install cuDSS 0.6.0 and NVPL 25.5 from NVIDIA's local-repo
# installer packages. Each installer registers a local apt repository under
# /var; its keyring is copied into /usr/share/keyrings before installing.
#
# Changes from the previous version: the script runs under "set -e" so a failed
# download or install aborts the build, and the downloaded installer .deb files
# and the apt cache/lists are removed in this same layer instead of being left
# in the image.
#
# NOTE: the heredoc delimiter is unquoted, so variable references are expanded
# before bash reads the script; do not introduce script-local variables here.
RUN <<EOT bash
    set -e
    if [ "${BUILD_TYPE}" = "cublas" ] && [ "${TARGETARCH}" = "arm64" ]; then
        wget https://developer.download.nvidia.com/compute/cudss/0.6.0/local_installers/cudss-local-tegra-repo-ubuntu${UBUNTU_VERSION}-0.6.0_0.6.0-1_arm64.deb
        dpkg -i cudss-local-tegra-repo-ubuntu${UBUNTU_VERSION}-0.6.0_0.6.0-1_arm64.deb
        rm -f cudss-local-tegra-repo-ubuntu${UBUNTU_VERSION}-0.6.0_0.6.0-1_arm64.deb
        cp /var/cudss-local-tegra-repo-ubuntu${UBUNTU_VERSION}-0.6.0/cudss-*-keyring.gpg /usr/share/keyrings/
        apt-get update
        apt-get -y install cudss cudss-cuda-${CUDA_MAJOR_VERSION}

        wget https://developer.download.nvidia.com/compute/nvpl/25.5/local_installers/nvpl-local-repo-ubuntu${UBUNTU_VERSION}-25.5_1.0-1_arm64.deb
        dpkg -i nvpl-local-repo-ubuntu${UBUNTU_VERSION}-25.5_1.0-1_arm64.deb
        rm -f nvpl-local-repo-ubuntu${UBUNTU_VERSION}-25.5_1.0-1_arm64.deb
        cp /var/nvpl-local-repo-ubuntu${UBUNTU_VERSION}-25.5/nvpl-*-keyring.gpg /usr/share/keyrings/
        apt-get update
        apt-get install -y nvpl

        apt-get clean
        rm -rf /var/lib/apt/lists/*
    fi
EOT
|
|
|
|
|
|
|
|
# clblas: install the CLBlast development package (skipped when
# SKIP_DRIVERS is not "false").
RUN if [ "${BUILD_TYPE}" = "clblas" ] && [ "${SKIP_DRIVERS}" = "false" ]; then \
        apt-get update \
        && apt-get install -y --no-install-recommends \
            libclblast-dev \
        && apt-get clean \
        && rm -rf /var/lib/apt/lists/*; \
    fi
|
|
|
|
|
# hipblas: install the hipBLAS/rocBLAS development packages, record "amd" as
# the image capability, and refresh the dynamic linker cache.
# NOTE(review): no ROCm apt repository is configured in this file, so the
# packages presumably come from the chosen base image - confirm.
RUN if [ "${BUILD_TYPE}" = "hipblas" ] && [ "${SKIP_DRIVERS}" = "false" ]; then \
        apt-get update \
        && apt-get install -y --no-install-recommends \
            hipblas-dev \
            rocblas-dev \
        && apt-get clean \
        && rm -rf /var/lib/apt/lists/* \
        && echo "amd" > /run/localai/capability \
        && ldconfig; \
    fi
|
|
|
|
|
# hipblas: expose the libomp.so found under the versioned /opt/rocm-* tree at
# /usr/lib/libomp.so. This runs regardless of SKIP_DRIVERS.
RUN if [ "${BUILD_TYPE}" = "hipblas" ]; then \
        ln -s /opt/rocm-**/lib/llvm/lib/libomp.so /usr/lib/libomp.so; \
    fi
|
|
|
|
|
# intel: record "intel" as the image capability; any other build type just logs
# "not intel". A plain test replaces the earlier `expr` comparison, which
# printed its 0/1 result into the build log and interprets operands that look
# like expr operators instead of comparing them as strings.
RUN if [ "${BUILD_TYPE}" = "intel" ]; then \
        echo "intel" > /run/localai/capability; \
    else \
        echo "not intel"; \
    fi
|
|
|
|
|
|
|
|
# Put the ROCm and CUDA tool directories at the front of PATH, ROCm first.
# The directories are added unconditionally, whatever BUILD_TYPE is.
ENV PATH=/opt/rocm/bin:/usr/local/cuda/bin:${PATH}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Stage "build-requirements": compilers and tooling needed to build the
# project, layered on top of the driver stage.
FROM requirements-drivers AS build-requirements

# Tool versions used by the install steps in this stage.
ARG GO_VERSION=1.25.4
ARG CMAKE_VERSION=3.31.10
# When "true", CMake is compiled from the release tarball instead of using apt.
ARG CMAKE_FROM_SOURCE=false

# Platform arguments for the image being built.
ARG TARGETARCH
ARG TARGETVARIANT

RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        ccache \
        curl \
        espeak-ng \
        git \
        git-lfs \
        libssl-dev \
        python-is-python3 \
        python3 \
        unzip \
        upx-ucl \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*
|
|
|
|
|
|
|
|
# Install CMake: compiled from the Kitware release tarball when
# CMAKE_FROM_SOURCE=true, otherwise from the distribution package.
#
# Changes from the previous version:
#  - "set -e" so a failure in the apt branch aborts the build;
#  - curl uses -f so an HTTP error fails instead of being saved as the tarball;
#  - the tarball and extracted source tree are deleted after "make install",
#    in the same layer, so they do not remain in the image.
#
# NOTE: the heredoc delimiter is unquoted, so variable references are expanded
# before bash reads the script; do not introduce script-local variables here.
RUN <<EOT bash
    set -e
    if [ "${CMAKE_FROM_SOURCE}" = "true" ]; then
        curl -fsSL https://github.com/Kitware/CMake/releases/download/v${CMAKE_VERSION}/cmake-${CMAKE_VERSION}.tar.gz -o cmake.tar.gz
        tar xf cmake.tar.gz
        cd cmake-${CMAKE_VERSION}
        ./configure
        make
        make install
        cd ..
        rm -rf cmake.tar.gz cmake-${CMAKE_VERSION}
    else
        apt-get update
        apt-get install -y \
            cmake
        apt-get clean
        rm -rf /var/lib/apt/lists/*
    fi
EOT
|
|
|
|
|
|
|
|
# Install the Go toolchain for the target architecture into /usr/local/go.
# The archive is downloaded to a file with `curl -f` and then extracted, rather
# than piped straight into tar: the default shell has no pipefail, and without
# -f an HTTP error body would be handed to tar as if it were the archive.
RUN curl -fsSL -o /tmp/go.tar.gz https://go.dev/dl/go${GO_VERSION}.linux-${TARGETARCH}.tar.gz \
    && tar -C /usr/local -xzf /tmp/go.tar.gz \
    && rm -f /tmp/go.tar.gz

# Make the Go toolchain and binaries installed by `go install` available.
ENV PATH=$PATH:/root/go/bin:/usr/local/go/bin
|
|
|
|
|
|
|
|
# Install the protoc plugins for Go and Go gRPC code generation. Both are
# pinned: protoc-gen-go to a release tag, protoc-gen-go-grpc to a commit.
RUN go install google.golang.org/protobuf/cmd/protoc-gen-go@v1.34.2 \
    && go install google.golang.org/grpc/cmd/protoc-gen-go-grpc@1958fcbe2ca8bd93af633f11e97d44e567e945af
|
|
|
|
|
# Add any certificates from the build context's custom-ca-certs directory to
# the system trust store (copied with mode 0644), then rebuild the bundle.
COPY --chmod=644 custom-ca-certs/* /usr/local/share/ca-certificates/
RUN update-ca-certificates
|
|
|
|
|
# Print a warning (without failing the build) when TARGETARCH is empty.
RUN if [ -z "$TARGETARCH" ]; then \
        echo 'warn: missing $TARGETARCH, either set this `ARG` manually, or run using `docker buildkit`'; \
    fi

# Log the resolved platform values into the build output.
RUN echo "Target Architecture: $TARGETARCH" \
    && echo "Target Variant: $TARGETVARIANT"

# Working directory for the build steps in stages derived from this one.
WORKDIR /build
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Stage "intel": adds Intel's GPU apt repository and the oneAPI runtime
# libraries on top of INTEL_BASE_IMAGE.
# NOTE(review): wget and gpg are not installed in this stage, so they are
# presumably provided by INTEL_BASE_IMAGE - confirm.
FROM ${INTEL_BASE_IMAGE} AS intel

# Redeclared inside the stage so the value is available to the RUN steps below.
ARG UBUNTU_CODENAME=noble

# Store Intel's repository signing key as a dearmored keyring, then register
# the (amd64-only) repository entry signed by that key.
RUN wget -qO - https://repositories.intel.com/gpu/intel-graphics.key \
        | gpg --yes --dearmor --output /usr/share/keyrings/intel-graphics.gpg \
    && echo "deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu ${UBUNTU_CODENAME}/lts/2350 unified" > /etc/apt/sources.list.d/intel-graphics.list

RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        intel-oneapi-runtime-libs \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Stage "builder-base": common build configuration shared by the backend
# builder, the application builder, and the devcontainer.
FROM build-requirements AS builder-base

# Build configuration supplied via --build-arg.
ARG GO_TAGS=""
ARG GRPC_BACKENDS
ARG MAKEFLAGS
ARG LD_FLAGS="-s -w"

# Platform arguments for the image being built.
ARG TARGETARCH
ARG TARGETVARIANT

# Declared explicitly because NVIDIA_REQUIRE_CUDA below interpolates it. The
# final stage declares it the same way; without a declaration in scope the
# value would come out as "cuda>=.0" on builders that do not inherit ARGs
# from the parent stage.
ARG CUDA_MAJOR_VERSION=12

# Persist the build configuration and NVIDIA container-runtime settings into
# the environment of this stage and its children.
ENV GRPC_BACKENDS=${GRPC_BACKENDS} \
    GO_TAGS=${GO_TAGS} \
    MAKEFLAGS=${MAKEFLAGS} \
    NVIDIA_DRIVER_CAPABILITIES=compute,utility \
    NVIDIA_REQUIRE_CUDA="cuda>=${CUDA_MAJOR_VERSION}.0" \
    NVIDIA_VISIBLE_DEVICES=all \
    LD_FLAGS=${LD_FLAGS}

# Log the effective configuration into the build output.
RUN echo "GO_TAGS: $GO_TAGS" && echo "TARGETARCH: $TARGETARCH"

WORKDIR /build
|
|
|
|
|
|
|
|
|
|
|
# Install the protoc 27.1 compiler binary for the target architecture into
# /usr/local/bin.
#
# Changes from the previous version:
#  - "set -e" so a failed step aborts the build;
#  - curl uses -f so an HTTP error fails instead of being saved as protoc.zip;
#  - an architecture other than amd64/arm64 now prints a warning instead of
#    being skipped silently (the build still continues, as before).
#
# NOTE: the heredoc delimiter is unquoted, so variable references are expanded
# before bash reads the script; do not introduce script-local variables here.
RUN <<EOT bash
    set -e
    if [ "amd64" = "$TARGETARCH" ]; then
        curl -fsSL https://github.com/protocolbuffers/protobuf/releases/download/v27.1/protoc-27.1-linux-x86_64.zip -o protoc.zip
    elif [ "arm64" = "$TARGETARCH" ]; then
        curl -fsSL https://github.com/protocolbuffers/protobuf/releases/download/v27.1/protoc-27.1-linux-aarch_64.zip -o protoc.zip
    else
        echo "warn: no protoc download configured for architecture '$TARGETARCH', skipping" >&2
        exit 0
    fi
    # -j drops the bin/ prefix so the binary lands directly in /usr/local/bin.
    unzip -j -d /usr/local/bin protoc.zip bin/protoc
    rm protoc.zip
EOT
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Stage "builder-backends": copies only the inputs needed to generate the Go
# protobuf code, so this stage is rebuilt only when those inputs change.
FROM builder-base AS builder-backends

ARG TARGETARCH
ARG TARGETVARIANT

WORKDIR /build

# Top-level build files.
COPY ./Makefile ./go.mod ./go.sum ./

# Backend sources and repository metadata.
COPY ./backend ./backend
COPY ./.git ./.git

# Go packages copied alongside the backends.
COPY ./pkg/grpc ./pkg/grpc
COPY ./pkg/utils ./pkg/utils
COPY ./pkg/langchain ./pkg/langchain

# List the build directory in the build log, then generate the Go protobuf code.
RUN ls -l ./
RUN make protogen-go
|
|
|
|
|
|
|
|
|
|
|
# Stage "builder": brings in the full source tree and runs the main build.
# The final stage copies /build/local-ai out of this stage.
FROM builder-backends AS builder

WORKDIR /build

# Copy the whole build context over the files staged by builder-backends.
COPY . .

RUN make build
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Stage "devcontainer": development image built on the shared builder
# configuration, with extra interactive tooling.
FROM builder-base AS devcontainer

COPY .devcontainer-scripts /.devcontainer-scripts

# The apt cache and package lists are now removed in the same layer, matching
# every other apt-get install in this file; previously they were left behind.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        less \
        ssh \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*

# Delve (Go debugger) and yq.
# NOTE(review): both are installed at @latest, so rebuilds are not
# reproducible; consider pinning explicit versions.
RUN go install github.com/go-delve/delve/cmd/dlv@latest

RUN go install github.com/mikefarah/yq/v4@latest
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Final image: the driver-enabled runtime base plus the binary produced by the
# "builder" stage.
# NOTE(review): there is no USER instruction, so the container runs as whatever
# user the base image defaults to (root for stock ubuntu) - confirm intended.
FROM requirements-drivers

# URL probed by the HEALTHCHECK below.
ENV HEALTHCHECK_ENDPOINT=http://localhost:8080/readyz

# Redeclared in this stage so NVIDIA_REQUIRE_CUDA can interpolate it.
ARG CUDA_MAJOR_VERSION=12

# NVIDIA container-runtime settings.
ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility \
    NVIDIA_REQUIRE_CUDA="cuda>=${CUDA_MAJOR_VERSION}.0" \
    NVIDIA_VISIBLE_DEVICES=all

WORKDIR /

# Entrypoint script from the build context, and the compiled binary from the
# builder stage; both land in /.
COPY ./entrypoint.sh .
COPY --from=builder /build/local-ai ./

# Create the data directories before they are declared as volumes.
RUN mkdir -p /models /backends

# Probe the readiness endpoint once a minute; each probe may take up to ten
# minutes, and ten consecutive failures mark the container unhealthy.
HEALTHCHECK --interval=1m --timeout=10m --retries=10 \
    CMD curl -f ${HEALTHCHECK_ENDPOINT} || exit 1

VOLUME /models /backends /configuration

# Documents the port used by the health-check endpoint above.
EXPOSE 8080

ENTRYPOINT [ "/entrypoint.sh" ]
|
|
|