@@ -767,14 +767,11 @@ static __device__ __forceinline__ void flash_attn_ext_f16_iter(
767767        }
768768    }
769769#else 
770-     GGML_UNUSED (Q_f2); GGML_UNUSED (K_h2); GGML_UNUSED (V_h2);
771-     GGML_UNUSED (mask_h2); GGML_UNUSED (dstk); GGML_UNUSED (dstk_fixup);
772-     GGML_UNUSED (scale); GGML_UNUSED (slope); GGML_UNUSED (logit_softcap);
773-     GGML_UNUSED (ne01); GGML_UNUSED (ne02); GGML_UNUSED (stride_K); GGML_UNUSED (stride_V);
774-     GGML_UNUSED (stride_mask); GGML_UNUSED (tile_K);
775-     GGML_UNUSED (tile_V); GGML_UNUSED (tile_mask); GGML_UNUSED (Q_B);
776-     GGML_UNUSED (VKQ_C); GGML_UNUSED (KQ_max); GGML_UNUSED (KQ_rowsum);
777-     GGML_UNUSED (kb0); GGML_UNUSED (tile_Q);
770+     GGML_UNUSED_VARS (Q_f2, K_h2, V_h2, mask_h2, dstk, dstk_fixup,
771+         scale, slope, logit_softcap, ne01, ne02,
772+         stride_K, stride_V, stride_mask,
773+         tile_Q, tile_K, tile_V, tile_mask,
774+         Q_B, VKQ_C, KQ_max, KQ_rowsum, kb0);
778775    NO_DEVICE_CODE;
779776#endif  //  TURING_MMA_AVAILABLE
780777}
@@ -1236,14 +1233,10 @@ static __device__ __forceinline__ void flash_attn_ext_f16_process_tile(
12361233        }
12371234    }
12381235#else 
1239-     GGML_UNUSED (Q_f2); GGML_UNUSED (K_h2); GGML_UNUSED (V_h2);
1240-     GGML_UNUSED (mask_h2); GGML_UNUSED (sinks_f);
1241-     GGML_UNUSED (dstk); GGML_UNUSED (dstk_fixup);
1242-     GGML_UNUSED (scale); GGML_UNUSED (slope); GGML_UNUSED (logit_softcap);
1243-     GGML_UNUSED (ne01); GGML_UNUSED (ne02);
1244-     GGML_UNUSED (stride_Q1); GGML_UNUSED (stride_Q2);
1245-     GGML_UNUSED (stride_K); GGML_UNUSED (stride_V); GGML_UNUSED (stride_mask);
1246-     GGML_UNUSED (jt); GGML_UNUSED (kb0_start); GGML_UNUSED (kb0_stop);
1236+     GGML_UNUSED_VARS (Q_f2, K_h2, V_h2, mask_h2, sinks_f, dstk, dstk_fixup,
1237+         scale, slope, logit_softcap, ne01, ne02,
1238+         stride_Q1, stride_Q2, stride_K, stride_V, stride_mask,
1239+         jt, kb0_start, kb0_stop);
12471240    NO_DEVICE_CODE;
12481241#endif  //  TURING_MMA_AVAILABLE
12491242}
@@ -1397,17 +1390,15 @@ static __global__ void flash_attn_ext_f16(
13971390        (Q_f2, K_h2, V_h2, mask_h2, sinks_f, dstk, dst_meta, scale, slope, logit_softcap,
13981391         ne01, ne02, stride_Q1, stride_Q2, stride_K, stride_V, stride_mask, jt, kb0_start_kernel, kb0_stop_kernel);
13991392#else 
1400-     GGML_UNUSED (Q); GGML_UNUSED (K); GGML_UNUSED (V); GGML_UNUSED (mask);
1401-     GGML_UNUSED (sinks); GGML_UNUSED (KV_max); GGML_UNUSED (dst); GGML_UNUSED (dst_meta);
1402-     GGML_UNUSED (scale); GGML_UNUSED (max_bias); GGML_UNUSED (m0); GGML_UNUSED (m1);
1403-     GGML_UNUSED (n_head_log2); GGML_UNUSED (logit_softcap);
1404-     GGML_UNUSED (ne00); GGML_UNUSED (ne01); GGML_UNUSED (ne02); GGML_UNUSED (ne03);
1405-     GGML_UNUSED (nb01); GGML_UNUSED (nb02); GGML_UNUSED (nb03);
1406-     GGML_UNUSED (ne10); GGML_UNUSED (ne11); GGML_UNUSED (ne12); GGML_UNUSED (ne13);
1407-     GGML_UNUSED (nb11); GGML_UNUSED (nb12); GGML_UNUSED (nb13);
1408-     GGML_UNUSED (nb21); GGML_UNUSED (nb22); GGML_UNUSED (nb23);
1409-     GGML_UNUSED (ne31); GGML_UNUSED (ne32); GGML_UNUSED (ne33);
1410-     GGML_UNUSED (nb31); GGML_UNUSED (nb32); GGML_UNUSED (nb33);
1393+     GGML_UNUSED_VARS (Q, K, V, mask, sinks, KV_max, dst, dst_meta, scale,
1394+         max_bias, m0, m1, n_head_log2, logit_softcap,
1395+         ne00, ne01, ne02, ne03,
1396+               nb01, nb02, nb03,
1397+         ne10, ne11, ne12, ne13,
1398+               nb11, nb12, nb13,
1399+               nb21, nb22, nb23,
1400+               ne31, ne32, ne33,
1401+               nb31, nb32, nb33);
14111402    NO_DEVICE_CODE;
14121403#endif  //  defined(FLASH_ATTN_AVAILABLE) && defined(TURING_MMA_AVAILABLE)
14131404}
0 commit comments