We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1b25cbb · commit f105e0f · Copy full SHA for f105e0f
ggml/src/CMakeLists.txt
@@ -308,9 +308,9 @@ if (GGML_CUDA)
308
# 61 == integer CUDA intrinsics
309
# 70 == compute capability at which unrolling a loop in mul_mat_q kernels is faster
310
if (GGML_CUDA_F16 OR GGML_CUDA_DMMV_F16)
311
- set(CMAKE_CUDA_ARCHITECTURES "52;60;61;70;75;86")
+ set(CMAKE_CUDA_ARCHITECTURES "60;61;70;75")
312
else()
313
- set(CMAKE_CUDA_ARCHITECTURES "52;61;70;75;86")
+ set(CMAKE_CUDA_ARCHITECTURES "52;61;70;75")
314
#set(CMAKE_CUDA_ARCHITECTURES "OFF") # use this to compile much faster, but only F16 models work
315
endif()
316
0 commit comments