We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 003b9f7 commit 2d5acca — Copy full SHA for 2d5acca
ggml/src/ggml-cuda/mmq.cuh
@@ -2570,9 +2570,9 @@ static __device__ void mul_mat_q_process_tile(
2570
2571
template <ggml_type type, int mmq_x, int nwarps, bool need_check>
2572
#if defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)
2573
-#if defined(RDNA3) || defined(RDNA2) || defined(CDNA)
+#if defined(RDNA3) || defined(RDNA2) || defined(CDNA) || defined(GCN)
2574
__launch_bounds__(WARP_SIZE*nwarps, 2)
2575
-#endif // defined(RDNA3) || defined(RDNA2)
+#endif // defined(RDNA3) || defined(RDNA2) || defined(CDNA) || defined(GCN)
2576
#else
2577
#if __CUDA_ARCH__ >= CC_VOLTA
2578
__launch_bounds__(WARP_SIZE*nwarps, 1)
0 commit comments