1 file changed: +2 -0 lines changed
Original file line number | Diff line number | Diff line change
10 10
1111template <int D, int ncols2>
1212static void ggml_cuda_flash_attn_ext_mma_f16_switch_ncols1 (ggml_backend_cuda_context & ctx, ggml_tensor * dst) {
13+ GGML_LOG_INFO (" ggml_cuda_flash_attn_ext_mma_f16_switch_ncols1: D=%d, ncols2=%d" , D, ncols2);
1314 const ggml_tensor * Q = dst->src [0 ];
1415
1516 if (Q->ne [1 ] <= 8 /ncols2) {
@@ -32,6 +33,7 @@ static void ggml_cuda_flash_attn_ext_mma_f16_switch_ncols1(ggml_backend_cuda_con
3233
3334template <int ncols2>
3435static void ggml_cuda_flash_attn_ext_mma_f16_switch_hs (ggml_backend_cuda_context & ctx, ggml_tensor * dst) {
36+ GGML_LOG_INFO (" ggml_cuda_flash_attn_ext_mma_f16_switch_hs: ncols2=%d" , ncols2);
3537 const ggml_tensor * Q = dst->src [0 ];
3638
3739 switch (Q->ne [0 ]) {
You can’t perform that action at this time.
0 commit comments