Skip to content

Commit 2d5acca

Browse files
committed
ggml_cuda: set launch bounds also for GCN as it helps there too
1 parent 003b9f7 commit 2d5acca

File tree

1 file changed: +2 -2 lines changed

ggml/src/ggml-cuda/mmq.cuh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2570,9 +2570,9 @@ static __device__ void mul_mat_q_process_tile(
2570 2570

2571 2571
template <ggml_type type, int mmq_x, int nwarps, bool need_check>
2572 2572
#if defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)
2573 -
#if defined(RDNA3) || defined(RDNA2) || defined(CDNA)
2573 +
#if defined(RDNA3) || defined(RDNA2) || defined(CDNA) || defined(GCN)
2574 2574
__launch_bounds__(WARP_SIZE*nwarps, 2)
2575 -
#endif // defined(RDNA3) || defined(RDNA2)
2575 +
#endif // defined(RDNA3) || defined(RDNA2) || defined(CDNA) || defined(GCN)
2576 2576
#else
2577 2577
#if __CUDA_ARCH__ >= CC_VOLTA
2578 2578
__launch_bounds__(WARP_SIZE*nwarps, 1)

0 commit comments

Comments
 (0)