We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4721a56 commit 6a199ddCopy full SHA for 6a199dd
ggml/src/ggml-cuda/fattn-mma-f16.cuh
@@ -874,8 +874,6 @@ static __device__ __forceinline__ void flash_attn_ext_f16_process_tile(
874
}
875
876
877
- __syncthreads();
878
-
879
// Write back combined meta data:
880
#pragma unroll
881
for (int imeta = 0; imeta < nmeta; ++imeta) {
ggml/src/ggml-cuda/fattn-vec-f16.cuh
@@ -168,7 +168,6 @@ static __global__ void flash_attn_vec_ext_f16(
168
for (int j = 0; j < ncols; ++j) {
169
KQ[j*D + tid] = -HALF_MAX_HALF;
170
171
172
173
half2 VKQ[ncols] = {{0.0f, 0.0f}};
174
0 commit comments