We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 8b78786, commit ca8f361 (Copy full SHA for ca8f361)
ggml/src/ggml-cuda/fattn-wmma-f16.cuh
@@ -27,7 +27,7 @@ static bool ggml_cuda_should_use_wmma_fattn(const int cc) {
27
#if defined(GGML_USE_HIP) && !defined(GGML_HIP_ROCWMMA_FATTN)
28
return false;
29
#else
30
- if ((GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) == GGML_CUDA_CC_VOLTA) ||
+ if ((GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_VOLTA) ||
31
GGML_CUDA_CC_IS_RDNA3(cc) || GGML_CUDA_CC_IS_MTHREADS(cc)) {
32
return true;
33
} else if (GGML_CUDA_CC_IS_CDNA(cc)){
0 commit comments