|
|
--- |
|
|
name: 'build backend container images' |
|
|
|
|
|
on: |
|
|
push: |
|
|
branches: |
|
|
- master |
|
|
tags: |
|
|
- '*' |
|
|
|
|
|
concurrency: |
|
|
group: ci-backends-${{ github.head_ref || github.ref }}-${{ github.repository }} |
|
|
cancel-in-progress: true |
|
|
|
|
|
jobs: |
|
|
backend-jobs: |
|
|
uses: ./.github/workflows/backend_build.yml |
|
|
with: |
|
|
tag-latest: ${{ matrix.tag-latest }} |
|
|
tag-suffix: ${{ matrix.tag-suffix }} |
|
|
build-type: ${{ matrix.build-type }} |
|
|
cuda-major-version: ${{ matrix.cuda-major-version }} |
|
|
cuda-minor-version: ${{ matrix.cuda-minor-version }} |
|
|
platforms: ${{ matrix.platforms }} |
|
|
runs-on: ${{ matrix.runs-on }} |
|
|
base-image: ${{ matrix.base-image }} |
|
|
backend: ${{ matrix.backend }} |
|
|
dockerfile: ${{ matrix.dockerfile }} |
|
|
skip-drivers: ${{ matrix.skip-drivers }} |
|
|
context: ${{ matrix.context }} |
|
|
ubuntu-version: ${{ matrix.ubuntu-version }} |
|
|
secrets: |
|
|
dockerUsername: ${{ secrets.DOCKERHUB_USERNAME }} |
|
|
dockerPassword: ${{ secrets.DOCKERHUB_PASSWORD }} |
|
|
quayUsername: ${{ secrets.LOCALAI_REGISTRY_USERNAME }} |
|
|
quayPassword: ${{ secrets.LOCALAI_REGISTRY_PASSWORD }} |
|
|
strategy: |
|
|
fail-fast: false |
|
|
|
|
|
matrix: |
|
|
include: |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-diffusers' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
skip-drivers: 'true' |
|
|
backend: "diffusers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-diffusers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'true' |
|
|
backend: "diffusers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-chatterbox' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'true' |
|
|
backend: "chatterbox" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-moonshine' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'true' |
|
|
backend: "moonshine" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-vibevoice' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "vibevoice" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-pocket-tts' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "pocket-tts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-rerankers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "rerankers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-llama-cpp' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-vllm' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "vllm" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-transformers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "transformers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-diffusers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "diffusers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-kokoro' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "kokoro" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-faster-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "faster-whisper" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-coqui' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "coqui" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-bark' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "bark" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-chatterbox' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "chatterbox" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-moonshine' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "moonshine" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-stablediffusion-ggml' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "stablediffusion-ggml" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-rfdetr' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "rfdetr" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-exllama2' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "exllama2" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "9" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-12-neutts' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "neutts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-rerankers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "rerankers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-vibevoice' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "vibevoice" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-pocket-tts' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "pocket-tts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-llama-cpp' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'false' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-cuda-13-arm64-llama-cpp' |
|
|
base-image: "ubuntu:24.04" |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
ubuntu-version: '2404' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-transformers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "transformers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-diffusers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "diffusers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-cuda-13-arm64-vibevoice' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
ubuntu-version: '2404' |
|
|
backend: "vibevoice" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-cuda-13-arm64-pocket-tts' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
ubuntu-version: '2404' |
|
|
backend: "pocket-tts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-cuda-13-arm64-diffusers' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
ubuntu-version: '2404' |
|
|
backend: "diffusers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-kokoro' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "kokoro" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-faster-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "faster-whisper" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-bark' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "bark" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-chatterbox' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "chatterbox" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-moonshine' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "moonshine" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-stablediffusion-ggml' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "stablediffusion-ggml" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'false' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-cuda-13-arm64-stablediffusion-ggml' |
|
|
base-image: "ubuntu:24.04" |
|
|
ubuntu-version: '2404' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
backend: "stablediffusion-ggml" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'false' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-cuda-13-arm64-whisper' |
|
|
base-image: "ubuntu:24.04" |
|
|
ubuntu-version: '2404' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "13" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-nvidia-cuda-13-rfdetr' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "rfdetr" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-rerankers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "rerankers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-llama-cpp' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-vllm' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "vllm" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-transformers' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "transformers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-diffusers' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "diffusers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-kokoro' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "kokoro" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-vibevoice' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "vibevoice" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-pocket-tts' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "pocket-tts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-faster-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "faster-whisper" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-coqui' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "coqui" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-bark' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "bark" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-rerankers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "rerankers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'sycl_f32' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-sycl-f32-llama-cpp' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'sycl_f16' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-sycl-f16-llama-cpp' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-vllm' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "vllm" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-transformers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "transformers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-diffusers' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "diffusers" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-vibevoice' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
skip-drivers: 'true' |
|
|
backend: "vibevoice" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-pocket-tts' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
skip-drivers: 'true' |
|
|
backend: "pocket-tts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-kokoro' |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
skip-drivers: 'true' |
|
|
backend: "kokoro" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
|
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-kokoro' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "kokoro" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-faster-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "faster-whisper" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-vibevoice' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "vibevoice" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-pocket-tts' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "pocket-tts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-coqui' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "coqui" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-bark' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "bark" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-piper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "piper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-bark-cpp' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "bark-cpp" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-llama-cpp' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'false' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-arm64-llama-cpp' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
- build-type: 'vulkan' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-vulkan-llama-cpp' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "llama-cpp" |
|
|
dockerfile: "./backend/Dockerfile.llama-cpp" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-stablediffusion-ggml' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "stablediffusion-ggml" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'sycl_f32' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-sycl-f32-stablediffusion-ggml' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "stablediffusion-ggml" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'sycl_f16' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-sycl-f16-stablediffusion-ggml' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "stablediffusion-ggml" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'vulkan' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-vulkan-stablediffusion-ggml' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "stablediffusion-ggml" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'false' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-arm64-stablediffusion-ggml' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
backend: "stablediffusion-ggml" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'sycl_f32' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-sycl-f32-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'sycl_f16' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-sycl-f16-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'vulkan' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-vulkan-whisper' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'cublas' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'false' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-arm64-whisper' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-whisper' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
runs-on: 'ubuntu-latest' |
|
|
skip-drivers: 'false' |
|
|
backend: "whisper" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-silero-vad' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "silero-vad" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-local-store' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "local-store" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-huggingface' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "huggingface" |
|
|
dockerfile: "./backend/Dockerfile.golang" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-rfdetr' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "rfdetr" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-rfdetr' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "rfdetr" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'true' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-arm64-rfdetr' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
backend: "rfdetr" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-exllama2' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "exllama2" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'intel' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-intel-exllama2' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "intel/oneapi-basekit:2025.3.0-0-devel-ubuntu24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "exllama2" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
skip-drivers: 'true' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-hipblas-exllama2' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
runs-on: 'ubuntu-latest' |
|
|
backend: "exllama2" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'true' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-arm64-chatterbox' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
backend: "chatterbox" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-kitten-tts' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "kitten-tts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
|
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-neutts' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "neutts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'hipblas' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-gpu-rocm-hipblas-neutts' |
|
|
runs-on: 'arc-runner-set' |
|
|
base-image: "rocm/dev-ubuntu-24.04:6.4.4" |
|
|
skip-drivers: 'false' |
|
|
backend: "neutts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: 'l4t' |
|
|
cuda-major-version: "12" |
|
|
cuda-minor-version: "0" |
|
|
platforms: 'linux/arm64' |
|
|
skip-drivers: 'true' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-nvidia-l4t-arm64-neutts' |
|
|
base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0" |
|
|
runs-on: 'ubuntu-24.04-arm' |
|
|
backend: "neutts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2204' |
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-vibevoice' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "vibevoice" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
- build-type: '' |
|
|
cuda-major-version: "" |
|
|
cuda-minor-version: "" |
|
|
platforms: 'linux/amd64,linux/arm64' |
|
|
tag-latest: 'auto' |
|
|
tag-suffix: '-cpu-pocket-tts' |
|
|
runs-on: 'ubuntu-latest' |
|
|
base-image: "ubuntu:24.04" |
|
|
skip-drivers: 'false' |
|
|
backend: "pocket-tts" |
|
|
dockerfile: "./backend/Dockerfile.python" |
|
|
context: "./" |
|
|
ubuntu-version: '2404' |
|
|
backend-jobs-darwin: |
|
|
uses: ./.github/workflows/backend_build_darwin.yml |
|
|
strategy: |
|
|
matrix: |
|
|
include: |
|
|
- backend: "diffusers" |
|
|
tag-suffix: "-metal-darwin-arm64-diffusers" |
|
|
build-type: "mps" |
|
|
- backend: "mlx" |
|
|
tag-suffix: "-metal-darwin-arm64-mlx" |
|
|
build-type: "mps" |
|
|
- backend: "chatterbox" |
|
|
tag-suffix: "-metal-darwin-arm64-chatterbox" |
|
|
build-type: "mps" |
|
|
- backend: "mlx-vlm" |
|
|
tag-suffix: "-metal-darwin-arm64-mlx-vlm" |
|
|
build-type: "mps" |
|
|
- backend: "mlx-audio" |
|
|
tag-suffix: "-metal-darwin-arm64-mlx-audio" |
|
|
build-type: "mps" |
|
|
- backend: "stablediffusion-ggml" |
|
|
tag-suffix: "-metal-darwin-arm64-stablediffusion-ggml" |
|
|
build-type: "metal" |
|
|
lang: "go" |
|
|
- backend: "whisper" |
|
|
tag-suffix: "-metal-darwin-arm64-whisper" |
|
|
build-type: "metal" |
|
|
lang: "go" |
|
|
with: |
|
|
backend: ${{ matrix.backend }} |
|
|
build-type: ${{ matrix.build-type }} |
|
|
go-version: "1.24.x" |
|
|
tag-suffix: ${{ matrix.tag-suffix }} |
|
|
lang: ${{ matrix.lang || 'python' }} |
|
|
use-pip: ${{ matrix.backend == 'diffusers' }} |
|
|
runs-on: "macos-latest" |
|
|
secrets: |
|
|
dockerUsername: ${{ secrets.DOCKERHUB_USERNAME }} |
|
|
dockerPassword: ${{ secrets.DOCKERHUB_PASSWORD }} |
|
|
quayUsername: ${{ secrets.LOCALAI_REGISTRY_USERNAME }} |
|
|
quayPassword: ${{ secrets.LOCALAI_REGISTRY_PASSWORD }} |
|
|
llama-cpp-darwin: |
|
|
runs-on: macos-latest |
|
|
strategy: |
|
|
matrix: |
|
|
go-version: ['1.25.x'] |
|
|
steps: |
|
|
- name: Clone |
|
|
uses: actions/checkout@v6 |
|
|
with: |
|
|
submodules: true |
|
|
- name: Setup Go ${{ matrix.go-version }} |
|
|
uses: actions/setup-go@v5 |
|
|
with: |
|
|
go-version: ${{ matrix.go-version }} |
|
|
cache: false |
|
|
|
|
|
- name: Display Go version |
|
|
run: go version |
|
|
- name: Dependencies |
|
|
run: | |
|
|
brew install protobuf grpc make protoc-gen-go protoc-gen-go-grpc libomp llvm |
|
|
- name: Build llama-cpp-darwin |
|
|
run: | |
|
|
make protogen-go |
|
|
make backends/llama-cpp-darwin |
|
|
- name: Upload llama-cpp.tar |
|
|
uses: actions/upload-artifact@v6 |
|
|
with: |
|
|
name: llama-cpp-tar |
|
|
path: backend-images/llama-cpp.tar |
|
|
llama-cpp-darwin-publish: |
|
|
needs: llama-cpp-darwin |
|
|
if: github.event_name != 'pull_request' |
|
|
runs-on: ubuntu-latest |
|
|
steps: |
|
|
- name: Download llama-cpp.tar |
|
|
uses: actions/download-artifact@v7 |
|
|
with: |
|
|
name: llama-cpp-tar |
|
|
path: . |
|
|
- name: Install crane |
|
|
run: | |
|
|
curl -L https://github.com/google/go-containerregistry/releases/latest/download/go-containerregistry_Linux_x86_64.tar.gz | tar -xz |
|
|
sudo mv crane /usr/local/bin/ |
|
|
- name: Log in to DockerHub |
|
|
run: | |
|
|
echo "${{ secrets.DOCKERHUB_PASSWORD }}" | crane auth login docker.io -u "${{ secrets.DOCKERHUB_USERNAME }}" --password-stdin |
|
|
- name: Log in to quay.io |
|
|
run: | |
|
|
echo "${{ secrets.LOCALAI_REGISTRY_PASSWORD }}" | crane auth login quay.io -u "${{ secrets.LOCALAI_REGISTRY_USERNAME }}" --password-stdin |
|
|
- name: Docker meta |
|
|
id: meta |
|
|
uses: docker/metadata-action@v5 |
|
|
with: |
|
|
images: | |
|
|
localai/localai-backends |
|
|
tags: | |
|
|
type=ref,event=branch |
|
|
type=semver,pattern={{raw}} |
|
|
type=sha |
|
|
flavor: | |
|
|
latest=auto |
|
|
suffix=-metal-darwin-arm64-llama-cpp,onlatest=true |
|
|
- name: Docker meta |
|
|
id: quaymeta |
|
|
uses: docker/metadata-action@v5 |
|
|
with: |
|
|
images: | |
|
|
quay.io/go-skynet/local-ai-backends |
|
|
tags: | |
|
|
type=ref,event=branch |
|
|
type=semver,pattern={{raw}} |
|
|
type=sha |
|
|
flavor: | |
|
|
latest=auto |
|
|
suffix=-metal-darwin-arm64-llama-cpp,onlatest=true |
|
|
- name: Push Docker image (DockerHub) |
|
|
run: | |
|
|
for tag in $(echo "${{ steps.meta.outputs.tags }}" | tr ',' '\n'); do |
|
|
crane push llama-cpp.tar $tag |
|
|
done |
|
|
- name: Push Docker image (Quay) |
|
|
run: | |
|
|
for tag in $(echo "${{ steps.quaymeta.outputs.tags }}" | tr ',' '\n'); do |
|
|
crane push llama-cpp.tar $tag |
|
|
done |
|
|
|