Skip to content

Commit 9bef18c

Browse files
committed
ci: narrow CUDA wheel architectures
1 parent b516373 commit 9bef18c

1 file changed

Lines changed: 4 additions & 1 deletion

File tree

.github/workflows/build-wheels-cuda.yaml

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -133,7 +133,10 @@ jobs:
133 133
$env:CMAKE_ARGS = ''
134 134
}
135 135
$env:VERBOSE = '1'
136-
$env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON -DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=all -DCMAKE_CUDA_FLAGS=--allow-unsupported-compiler $env:CMAKE_ARGS"
136+
# Match upstream llama.cpp CI by targeting a conservative set of
137+
# CUDA architectures instead of `all`, which now includes newer
138+
# virtual architectures some toolkit versions cannot assemble.
139+
$env:CMAKE_ARGS = "-DGGML_CUDA_FORCE_MMQ=ON -DGGML_CUDA=on -DCMAKE_CUDA_ARCHITECTURES=61;70;75;80;86;89 -DCMAKE_CUDA_FLAGS=--allow-unsupported-compiler $env:CMAKE_ARGS"
137 140
# if ($env:AVXVER -eq 'AVX') {
138 141
$env:CMAKE_ARGS = $env:CMAKE_ARGS + ' -DGGML_AVX2=off -DGGML_FMA=off -DGGML_F16C=off'
139 142
# }

0 commit comments

Comments
 (0)