We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 794d740, commit d70d9f0. Copy full SHA for d70d9f0
ggml/src/ggml-cuda/fattn.cu
@@ -7,7 +7,7 @@
7
#include "fattn-vec-f32.cuh"
8
#include "fattn-wmma-f16.cuh"
9
#include "fattn.cuh"
10
-#include "ggml.h"
+#include "ggml-impl.h"
11
12
template <int D, int ncols2>
13
static void ggml_cuda_flash_attn_ext_mma_f16_switch_ncols1(ggml_backend_cuda_context & ctx, ggml_tensor * dst) {
0 commit comments