Skip to content

Commit 373d48e

Browse files
committed
Use GGML_CUDA_CC_IS_CDNA for checking CDNA architectures.
1 parent a135b4c commit 373d48e

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

ggml/src/ggml-cuda/common.cuh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -232,14 +232,14 @@ static bool fp16_mma_available(const int cc) {
232232
return false;
233233
#else
234234
return cc < GGML_CUDA_CC_OFFSET_AMD && ggml_cuda_highest_compiled_arch(cc) >= GGML_CUDA_CC_VOLTA ||
235-
cc >= GGML_CUDA_CC_CDNA && cc < GGML_CUDA_CC_RDNA1 || cc >= GGML_CUDA_CC_RDNA3;
235+
GGML_CUDA_CC_IS_CDNA(cc) || cc >= GGML_CUDA_CC_RDNA3;
236236
#endif // defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__) && !defined(GGML_HIP_ROCWMMA_FATTN)
237237
}
238238

239239
// To be used for feature selection of external libraries, e.g. cuBLAS.
240240
static bool fp16_mma_hardware_available(const int cc) {
241241
return cc < GGML_CUDA_CC_OFFSET_AMD && cc >= GGML_CUDA_CC_VOLTA ||
242-
cc >= GGML_CUDA_CC_CDNA && cc < GGML_CUDA_CC_RDNA1 || cc >= GGML_CUDA_CC_RDNA3;
242+
GGML_CUDA_CC_IS_CDNA(cc) || cc >= GGML_CUDA_CC_RDNA3;
243243
}
244244

245245
// Volta technically had FP16 tensor cores but they work very differently compared to Turing and later.

0 commit comments

Comments
 (0)