feat(vibevoice): add new backend (#7494)

* feat(vibevoice): add backend
  Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
* chore: add workflow and backend index
  Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
* chore(gallery): add vibevoice
  Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
* Use self-hosted for intel builds
  Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
* Pin python version for l4t
  Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
---------
Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
2026-01-04 17:50:13 -06:00 · 2025-12-10 21:14:21 +01:00
parent ef44ace73f
commit 32dcb58e89
21 changed files with 1164 additions and 1 deletions
--- a/.github/workflows/backend.yml
+++ b/.github/workflows/backend.yml
@@ -198,6 +198,19 @@ jobs:
            context: "./backend"
            ubuntu-version: '2204'
          # CUDA 12 builds
+          - build-type: 'cublas'  # vibevoice backend, CUDA 12.0 variant
+            cuda-major-version: "12"
+            cuda-minor-version: "0"
+            platforms: 'linux/amd64'
+            tag-latest: 'auto'
+            tag-suffix: '-gpu-nvidia-cuda-12-vibevoice'  # names the CUDA major version and the backend
+            runs-on: 'ubuntu-latest'
+            base-image: "ubuntu:22.04"
+            skip-drivers: 'false'  # NOTE(review): presumably controls driver setup in the image build; confirm
+            backend: "vibevoice"
+            dockerfile: "./backend/Dockerfile.python"
+            context: "./backend"
+            ubuntu-version: '2204'  # same release as base-image (ubuntu:22.04)
          - build-type: 'cublas'
            cuda-major-version: "12"
            cuda-minor-version: "0"
@@ -407,6 +420,19 @@ jobs:
            dockerfile: "./backend/Dockerfile.python"
            context: "./backend"
            ubuntu-version: '2204'
+          - build-type: 'cublas'  # vibevoice backend, CUDA 13.0 variant
+            cuda-major-version: "13"
+            cuda-minor-version: "0"
+            platforms: 'linux/amd64'
+            tag-latest: 'auto'
+            tag-suffix: '-gpu-nvidia-cuda-13-vibevoice'  # names the CUDA major version and the backend
+            runs-on: 'ubuntu-latest'
+            base-image: "ubuntu:22.04"
+            skip-drivers: 'false'  # NOTE(review): presumably controls driver setup in the image build; confirm
+            backend: "vibevoice"
+            dockerfile: "./backend/Dockerfile.python"
+            context: "./backend"
+            ubuntu-version: '2204'  # same release as base-image (ubuntu:22.04)
          - build-type: 'cublas'
            cuda-major-version: "13"
            cuda-minor-version: "0"
@@ -459,6 +485,19 @@ jobs:
            dockerfile: "./backend/Dockerfile.python"
            context: "./backend"
            ubuntu-version: '2204'
+          - build-type: 'l4t'  # vibevoice backend, l4t variant on CUDA 13.0 for arm64
+            cuda-major-version: "13"
+            cuda-minor-version: "0"
+            platforms: 'linux/arm64'
+            tag-latest: 'auto'
+            tag-suffix: '-nvidia-l4t-cuda-13-arm64-vibevoice'
+            runs-on: 'ubuntu-24.04-arm'  # arm runner, matching the arm64-only platform list
+            base-image: "ubuntu:24.04"
+            skip-drivers: 'false'  # NOTE(review): presumably controls driver setup in the image build; confirm
+            ubuntu-version: '2404'  # same release as base-image (ubuntu:24.04)
+            backend: "vibevoice"
+            dockerfile: "./backend/Dockerfile.python"
+            context: "./backend"
          - build-type: 'l4t'
            cuda-major-version: "13"
            cuda-minor-version: "0"
@@ -669,6 +708,19 @@ jobs:
            dockerfile: "./backend/Dockerfile.python"
            context: "./backend"
            ubuntu-version: '2204'
+          - build-type: 'hipblas'  # vibevoice backend, ROCm/hipBLAS variant
+            cuda-major-version: ""  # CUDA version fields are left empty for this non-CUDA build
+            cuda-minor-version: ""
+            platforms: 'linux/amd64'
+            tag-latest: 'auto'
+            tag-suffix: '-gpu-rocm-hipblas-vibevoice'
+            runs-on: 'arc-runner-set'
+            base-image: "rocm/dev-ubuntu-22.04:6.4.3"  # ROCm dev image, tag 6.4.3
+            skip-drivers: 'false'  # NOTE(review): presumably controls driver setup in the image build; confirm
+            backend: "vibevoice"
+            dockerfile: "./backend/Dockerfile.python"
+            context: "./backend"
+            ubuntu-version: '2204'
          - build-type: 'hipblas'
            cuda-major-version: ""
            cuda-minor-version: ""
@@ -787,6 +839,19 @@ jobs:
            dockerfile: "./backend/Dockerfile.python"
            context: "./backend"
            ubuntu-version: '2204'
+          - build-type: 'l4t'  # vibevoice backend, l4t variant on the JetPack base image (CUDA 12.0)
+            cuda-major-version: "12"
+            cuda-minor-version: "0"
+            platforms: 'linux/arm64'
+            tag-latest: 'auto'
+            tag-suffix: '-nvidia-l4t-vibevoice'
+            runs-on: 'ubuntu-24.04-arm'  # arm runner, matching the arm64-only platform list
+            base-image: "nvcr.io/nvidia/l4t-jetpack:r36.4.0"
+            skip-drivers: 'true'  # unlike the other vibevoice entries; NOTE(review): presumably the base image already ships drivers, confirm
+            backend: "vibevoice"
+            dockerfile: "./backend/Dockerfile.python"
+            context: "./backend"
+            ubuntu-version: '2204'
          - build-type: 'l4t'
            cuda-major-version: "12"
            cuda-minor-version: "0"
@@ -827,6 +892,19 @@ jobs:
            dockerfile: "./backend/Dockerfile.python"
            context: "./backend"
            ubuntu-version: '2204'
+          - build-type: 'intel'  # vibevoice backend, Intel GPU variant
+            cuda-major-version: ""  # CUDA version fields are left empty for this non-CUDA build
+            cuda-minor-version: ""
+            platforms: 'linux/amd64'
+            tag-latest: 'auto'
+            tag-suffix: '-gpu-intel-vibevoice'
+            runs-on: 'arc-runner-set'  # NOTE(review): presumably the self-hosted runner mentioned in the commit message; confirm
+            base-image: "quay.io/go-skynet/intel-oneapi-base:latest"  # floating ':latest' tag, not a pinned version
+            skip-drivers: 'false'  # NOTE(review): presumably controls driver setup in the image build; confirm
+            backend: "vibevoice"
+            dockerfile: "./backend/Dockerfile.python"
+            context: "./backend"
+            ubuntu-version: '2204'
          - build-type: 'intel'
            cuda-major-version: ""
            cuda-minor-version: ""
@@ -1319,6 +1397,19 @@ jobs:
            dockerfile: "./backend/Dockerfile.python"
            context: "./backend"
            ubuntu-version: '2204'
+          - build-type: ''  # vibevoice backend, CPU variant (empty build-type; see tag-suffix)
+            cuda-major-version: ""  # CUDA version fields are left empty for this non-CUDA build
+            cuda-minor-version: ""
+            platforms: 'linux/amd64,linux/arm64'  # the only vibevoice entry in this change listing two platforms
+            tag-latest: 'auto'
+            tag-suffix: '-cpu-vibevoice'
+            runs-on: 'ubuntu-latest'
+            base-image: "ubuntu:22.04"
+            skip-drivers: 'false'  # NOTE(review): presumably controls driver setup in the image build; confirm
+            backend: "vibevoice"
+            dockerfile: "./backend/Dockerfile.python"
+            context: "./backend"
+            ubuntu-version: '2204'  # same release as base-image (ubuntu:22.04)
  backend-jobs-darwin:
    uses: ./.github/workflows/backend_build_darwin.yml
    strategy: