We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 35ce3f6 · commit 1e0f64e · Copy full SHA for 1e0f64e
ggml/src/CMakeLists.txt
@@ -285,9 +285,9 @@ if (GGML_CUDA)
285
# 61 == integer CUDA intrinsics
286
# 70 == compute capability at which unrolling a loop in mul_mat_q kernels is faster
287
if (GGML_CUDA_F16 OR GGML_CUDA_DMMV_F16)
288
- set(CMAKE_CUDA_ARCHITECTURES "60;61;70;75")
+ set(CMAKE_CUDA_ARCHITECTURES "60;61;70;75;86")
289
else()
290
- set(CMAKE_CUDA_ARCHITECTURES "52;61;70;75")
+ set(CMAKE_CUDA_ARCHITECTURES "52;61;70;75;86")
291
#set(CMAKE_CUDA_ARCHITECTURES "OFF") # use this to compile much faster, but only F16 models work
292
endif()
293
0 commit comments