We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 066b909 commit fa7ea97 (Copy full SHA for fa7ea97)
ggml/src/ggml-cuda/fattn-wmma-f16.cu
@@ -56,7 +56,7 @@ static __global__ void flash_attn_ext_f16(
56
const int ne1,
57
const int ne2,
58
const int ne3) {
59
-#if defined(FLASH_ATTN_AVAILABLE) && ((__CUDA_ARCH__ == GGML_CUDA_CC_VOLTA || __CUDA_ARCH__ == GGML_CUDA_CC_TURING) || (defined(GGML_HIP_ROCWMMA_FATTN) && defined(FP16_MMA_AVAILABLE)))
+#if 0
60
// Skip unused kernel variants for faster compilation:
61
if (use_logit_softcap && !(D == 128 || D == 256)) {
62
NO_DEVICE_CODE;
0 commit comments