Skip to content

Commit 1b54391

Browse files
committed
Revert "with forced wmma for cu11"
This reverts commit f545f4d.
1 parent c90a17d commit 1b54391

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

ggml/src/ggml-cuda/fattn.cu

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -396,9 +396,9 @@ static best_fattn_kernel ggml_cuda_get_best_fattn_kernel(const int device, const
396 396
}
397 397

398 398
//kcpp: use wmma to fix cu11 incoherence
399-
if (fp16_mma_available(cc) && (ggml_cuda_highest_compiled_arch(cc) <= GGML_CUDA_CC_TURING || cc == GGML_CUDA_CC_TURING)) {
400-
return BEST_FATTN_KERNEL_WMMA_F16;
401-
}
399+
// if (fp16_mma_available(cc) && (ggml_cuda_highest_compiled_arch(cc) <= GGML_CUDA_CC_TURING || cc == GGML_CUDA_CC_TURING)) {
400+
// return BEST_FATTN_KERNEL_WMMA_F16;
401+
// }
402 402
return BEST_FATTN_KERNEL_MMA_F16;
403 403
}
404 404

0 commit comments

Comments
 (0)