Skip to content

Commit 6d7ef15

Browse files
authored
Recover FP16 performance and improve general performance
1 parent 36201c6 commit 6d7ef15

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml/src/ggml-cuda/common.cuh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -268,7 +268,7 @@ static bool fast_fp16_available(const int cc) {
268 268
269 269   // To be used for feature selection of external libraries, e.g. cuBLAS.
270 270   static bool fast_fp16_hardware_available(const int cc) {
271     -     return (GGML_CUDA_CC_IS_NVIDIA(cc) && cc >= GGML_CUDA_CC_PASCAL && cc != 610) || GGML_CUDA_CC_IS_AMD(cc) ||
    271 +     return (GGML_CUDA_CC_IS_NVIDIA(cc) && cc >= GGML_CUDA_CC_PASCAL && cc != 610 && !MMA_DISABLE) || GGML_CUDA_CC_IS_AMD(cc) ||
272 272           (GGML_CUDA_CC_IS_MTHREADS(cc) && cc >= GGML_CUDA_CC_QY2);
273 273   }
274 274

0 commit comments

Comments
 (0)