From 9b806250d4adf84f64d15022e32c6ae722c2e201 Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Tue, 22 Jul 2025 18:47:31 +0200 Subject: [PATCH] chore: drop vllm for cuda 11 (#5881) Signed-off-by: Ettore Di Giacinto --- .github/workflows/backend.yml | 12 ------------ backend/index.yaml | 6 ------ 2 files changed, 18 deletions(-) diff --git a/.github/workflows/backend.yml b/.github/workflows/backend.yml index f05607848..e557fe74a 100644 --- a/.github/workflows/backend.yml +++ b/.github/workflows/backend.yml @@ -63,18 +63,6 @@ jobs: backend: "llama-cpp" dockerfile: "./backend/Dockerfile.llama-cpp" context: "./" - - build-type: 'cublas' - cuda-major-version: "11" - cuda-minor-version: "7" - platforms: 'linux/amd64' - tag-latest: 'auto' - tag-suffix: '-gpu-nvidia-cuda-11-vllm' - runs-on: 'ubuntu-latest' - base-image: "ubuntu:22.04" - skip-drivers: 'false' - backend: "vllm" - dockerfile: "./backend/Dockerfile.python" - context: "./backend" - build-type: 'cublas' cuda-major-version: "11" cuda-minor-version: "7" diff --git a/backend/index.yaml b/backend/index.yaml index 608854605..78fc441e0 100644 --- a/backend/index.yaml +++ b/backend/index.yaml @@ -502,9 +502,6 @@ nvidia: "cuda12-vllm-development" amd: "rocm-vllm-development" intel: "intel-sycl-f16-vllm-development" -- !!merge <<: *vllm - name: "cuda11-vllm" - uri: "quay.io/go-skynet/local-ai-backends:latest-gpu-nvidia-cuda-11-vllm" - !!merge <<: *vllm name: "cuda12-vllm" uri: "quay.io/go-skynet/local-ai-backends:latest-gpu-nvidia-cuda-12-vllm" @@ -517,9 +514,6 @@ - !!merge <<: *vllm name: "intel-sycl-f16-vllm" uri: "quay.io/go-skynet/local-ai-backends:latest-gpu-intel-sycl-f16-vllm" -- !!merge <<: *vllm - name: "cuda11-vllm-development" - uri: "quay.io/go-skynet/local-ai-backends:master-gpu-nvidia-cuda-11-vllm" - !!merge <<: *vllm name: "cuda12-vllm-development" uri: "quay.io/go-skynet/local-ai-backends:master-gpu-nvidia-cuda-12-vllm"