File tree Expand file tree Collapse file tree 1 file changed +4
-0
lines changed Expand file tree Collapse file tree 1 file changed +4
-0
lines changed Original file line number Diff line number Diff line change @@ -237,8 +237,12 @@ static bool fp16_mma_available(const int cc) {
237237
238238// To be used for feature selection of external libraries, e.g. cuBLAS.
239239static bool fp16_mma_hardware_available (const int cc) {
240+ #if defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__) && !defined(GGML_HIP_ROCWMMA_FATTN)
241+ return false ;
242+ #else
240243 return cc < GGML_CUDA_CC_OFFSET_AMD && cc >= GGML_CUDA_CC_VOLTA ||
241244 cc >= GGML_CUDA_CC_CDNA && cc < GGML_CUDA_CC_RDNA1 || cc >= GGML_CUDA_CC_RDNA3;
245+ #endif // defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__) && !defined(GGML_HIP_ROCWMMA_FATTN)
242246}
243247
244248// Volta technically had FP16 tensor cores but they work very differently compared to Turing and later.
You can’t perform that action at this time.
0 commit comments