From 9ab647d54ace29668bea221da40857a7e965fa47 Mon Sep 17 00:00:00 2001 From: Weiqi Gao Date: Sun, 7 Dec 2025 18:53:56 +0800 Subject: [PATCH 1/4] Fix syntax for CUDA architecture definitions --- .github/workflows/build.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 8dd7ce19c..1f5bae306 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -163,7 +163,7 @@ jobs: - build: "avx512" defines: "-DGGML_NATIVE=OFF -DGGML_AVX512=ON -DGGML_AVX=ON -DGGML_AVX2=ON -DSD_BUILD_SHARED_LIBS=ON" - build: "cuda12" - defines: "-DSD_CUDA=ON -DSD_BUILD_SHARED_LIBS=ON -DCMAKE_CUDA_ARCHITECTURES=90;89;86;80;75" + defines: "-DSD_CUDA=ON -DSD_BUILD_SHARED_LIBS=ON -DCMAKE_CUDA_ARCHITECTURES='90;89;86;80;75'" - build: 'vulkan' defines: "-DSD_VULKAN=ON -DSD_BUILD_SHARED_LIBS=ON" steps: From 1f3378de0a53071d9c101e634e712accdc22b136 Mon Sep 17 00:00:00 2001 From: Weiqi Gao Date: Sun, 7 Dec 2025 19:11:52 +0800 Subject: [PATCH 2/4] Extend CUDA support to GTX 10 Series to RTX 50 Series --- .github/workflows/build.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 1f5bae306..dd7392081 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -163,7 +163,7 @@ jobs: - build: "avx512" defines: "-DGGML_NATIVE=OFF -DGGML_AVX512=ON -DGGML_AVX=ON -DGGML_AVX2=ON -DSD_BUILD_SHARED_LIBS=ON" - build: "cuda12" - defines: "-DSD_CUDA=ON -DSD_BUILD_SHARED_LIBS=ON -DCMAKE_CUDA_ARCHITECTURES='90;89;86;80;75'" + defines: "-DSD_CUDA=ON -DSD_BUILD_SHARED_LIBS=ON -DCMAKE_CUDA_ARCHITECTURES='61;70;75;80;86;89;90;100;103;120'" - build: 'vulkan' defines: "-DSD_VULKAN=ON -DSD_BUILD_SHARED_LIBS=ON" steps: @@ -178,7 +178,7 @@ jobs: if: ${{ matrix.build == 'cuda12' }} uses: Jimver/cuda-toolkit@v0.2.19 with: - cuda: "12.6.2" + cuda: "12.8.1" method: "network" sub-packages: '["nvcc", "cudart", "cublas", "cublas_dev", "thrust", "visual_studio_integration"]' From 09da54116015eaaa191a10a1f34a10e357034cd4 Mon Sep 17 00:00:00 2001 From: Weiqi Gao Date: Sun, 7 Dec 2025 20:27:03 +0800 Subject: [PATCH 3/4] update cuda installer step version to install cuda 12.8.1 --- .github/workflows/build.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index dd7392081..2f6a4ad1a 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -176,7 +176,7 @@ jobs: - name: Install cuda-toolkit id: cuda-toolkit if: ${{ matrix.build == 'cuda12' }} - uses: Jimver/cuda-toolkit@v0.2.19 + uses: Jimver/cuda-toolkit@v0.2.22 with: cuda: "12.8.1" method: "network" From c47281be0314371ec4be833bd0d52d07e340337c Mon Sep 17 00:00:00 2001 From: Weiqi Gao Date: Sun, 7 Dec 2025 20:57:22 +0800 Subject: [PATCH 4/4] Remove unsupported compute capability --- .github/workflows/build.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 2f6a4ad1a..7f78c354e 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -163,7 +163,7 @@ jobs: - build: "avx512" defines: "-DGGML_NATIVE=OFF -DGGML_AVX512=ON -DGGML_AVX=ON -DGGML_AVX2=ON -DSD_BUILD_SHARED_LIBS=ON" - build: "cuda12" - defines: "-DSD_CUDA=ON -DSD_BUILD_SHARED_LIBS=ON -DCMAKE_CUDA_ARCHITECTURES='61;70;75;80;86;89;90;100;103;120'" + defines: "-DSD_CUDA=ON -DSD_BUILD_SHARED_LIBS=ON -DCMAKE_CUDA_ARCHITECTURES='61;70;75;80;86;89;90;100;120'" - build: 'vulkan' defines: "-DSD_VULKAN=ON -DSD_BUILD_SHARED_LIBS=ON" steps: