Skip to content

Commit 66f4c93

Browse files
committed
CUDA/HIP: use mmv instead of rocblas for batch 3-5 mmv
1 parent 6a414d9 commit 66f4c93

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

ggml/src/ggml-cuda/mmv.cu

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -471,6 +471,9 @@ bool ggml_cuda_should_use_mmv(enum ggml_type type, int cc, const int64_t * src0_
471 471          }
472 472          return ne11 <= 8;
473 473      } else if (fp16_mma_hardware_available(cc)) {
    474 +        if (GGML_CUDA_CC_IS_RDNA3(cc) || GGML_CUDA_CC_IS_RDNA4(cc)) {
    475 +            return ne11 <= 5;
    476 +        }
474 477          return ne11 <= 2;
475 478      }
476 479      return ne11 <= 8;

0 commit comments

Comments
 (0)