We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1d72c84, commit c29d5d4 (Copy full SHA for c29d5d4)
ggml/src/ggml-cuda/common.cuh
@@ -312,7 +312,7 @@ static bool turing_mma_available(const int cc) {
312
}
313
314
static bool ampere_mma_available(const int cc) {
315
- return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
+ return GGML_CUDA_CC_IS_NVIDIA(cc) && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_AMPERE;
316
317
318
static bool cp_async_available(const int cc) {
0 commit comments