@@ -767,14 +767,11 @@ static __device__ __forceinline__ void flash_attn_ext_f16_iter(
767767 }
768768 }
769769#else
770- GGML_UNUSED (Q_f2); GGML_UNUSED (K_h2); GGML_UNUSED (V_h2);
771- GGML_UNUSED (mask_h2); GGML_UNUSED (dstk); GGML_UNUSED (dstk_fixup);
772- GGML_UNUSED (scale); GGML_UNUSED (slope); GGML_UNUSED (logit_softcap);
773- GGML_UNUSED (ne01); GGML_UNUSED (ne02); GGML_UNUSED (stride_K); GGML_UNUSED (stride_V);
774- GGML_UNUSED (stride_mask); GGML_UNUSED (tile_K);
775- GGML_UNUSED (tile_V); GGML_UNUSED (tile_mask); GGML_UNUSED (Q_B);
776- GGML_UNUSED (VKQ_C); GGML_UNUSED (KQ_max); GGML_UNUSED (KQ_rowsum);
777- GGML_UNUSED (kb0); GGML_UNUSED (tile_Q);
770+ GGML_UNUSED_VARS (Q_f2, K_h2, V_h2, mask_h2, dstk, dstk_fixup,
771+ scale, slope, logit_softcap, ne01, ne02,
772+ stride_K, stride_V, stride_mask,
773+ tile_Q, tile_K, tile_V, tile_mask,
774+ Q_B, VKQ_C, KQ_max, KQ_rowsum, kb0);
778775 NO_DEVICE_CODE;
779776#endif // TURING_MMA_AVAILABLE
780777}
@@ -1236,14 +1233,10 @@ static __device__ __forceinline__ void flash_attn_ext_f16_process_tile(
12361233 }
12371234 }
12381235#else
1239- GGML_UNUSED (Q_f2); GGML_UNUSED (K_h2); GGML_UNUSED (V_h2);
1240- GGML_UNUSED (mask_h2); GGML_UNUSED (sinks_f);
1241- GGML_UNUSED (dstk); GGML_UNUSED (dstk_fixup);
1242- GGML_UNUSED (scale); GGML_UNUSED (slope); GGML_UNUSED (logit_softcap);
1243- GGML_UNUSED (ne01); GGML_UNUSED (ne02);
1244- GGML_UNUSED (stride_Q1); GGML_UNUSED (stride_Q2);
1245- GGML_UNUSED (stride_K); GGML_UNUSED (stride_V); GGML_UNUSED (stride_mask);
1246- GGML_UNUSED (jt); GGML_UNUSED (kb0_start); GGML_UNUSED (kb0_stop);
1236+ GGML_UNUSED_VARS (Q_f2, K_h2, V_h2, mask_h2, sinks_f, dstk, dstk_fixup,
1237+ scale, slope, logit_softcap, ne01, ne02,
1238+ stride_Q1, stride_Q2, stride_K, stride_V, stride_mask,
1239+ jt, kb0_start, kb0_stop);
12471240 NO_DEVICE_CODE;
12481241#endif // TURING_MMA_AVAILABLE
12491242}
@@ -1397,17 +1390,15 @@ static __global__ void flash_attn_ext_f16(
13971390 (Q_f2, K_h2, V_h2, mask_h2, sinks_f, dstk, dst_meta, scale, slope, logit_softcap,
13981391 ne01, ne02, stride_Q1, stride_Q2, stride_K, stride_V, stride_mask, jt, kb0_start_kernel, kb0_stop_kernel);
13991392#else
1400- GGML_UNUSED (Q); GGML_UNUSED (K); GGML_UNUSED (V); GGML_UNUSED (mask);
1401- GGML_UNUSED (sinks); GGML_UNUSED (KV_max); GGML_UNUSED (dst); GGML_UNUSED (dst_meta);
1402- GGML_UNUSED (scale); GGML_UNUSED (max_bias); GGML_UNUSED (m0); GGML_UNUSED (m1);
1403- GGML_UNUSED (n_head_log2); GGML_UNUSED (logit_softcap);
1404- GGML_UNUSED (ne00); GGML_UNUSED (ne01); GGML_UNUSED (ne02); GGML_UNUSED (ne03);
1405- GGML_UNUSED (nb01); GGML_UNUSED (nb02); GGML_UNUSED (nb03);
1406- GGML_UNUSED (ne10); GGML_UNUSED (ne11); GGML_UNUSED (ne12); GGML_UNUSED (ne13);
1407- GGML_UNUSED (nb11); GGML_UNUSED (nb12); GGML_UNUSED (nb13);
1408- GGML_UNUSED (nb21); GGML_UNUSED (nb22); GGML_UNUSED (nb23);
1409- GGML_UNUSED (ne31); GGML_UNUSED (ne32); GGML_UNUSED (ne33);
1410- GGML_UNUSED (nb31); GGML_UNUSED (nb32); GGML_UNUSED (nb33);
1393+ GGML_UNUSED_VARS (Q, K, V, mask, sinks, KV_max, dst, dst_meta, scale,
1394+ max_bias, m0, m1, n_head_log2, logit_softcap,
1395+ ne00, ne01, ne02, ne03,
1396+ nb01, nb02, nb03,
1397+ ne10, ne11, ne12, ne13,
1398+ nb11, nb12, nb13,
1399+ nb21, nb22, nb23,
1400+ ne31, ne32, ne33,
1401+ nb31, nb32, nb33);
14111402 NO_DEVICE_CODE;
14121403#endif // defined(FLASH_ATTN_AVAILABLE) && defined(TURING_MMA_AVAILABLE)
14131404}
0 commit comments