@@ -61,16 +61,16 @@ enum mmvq_parameter_table_id {
6161 MMVQ_PARAMETERS_GENERIC = 0 ,
6262 MMVQ_PARAMETERS_GCN,
6363 MMVQ_PARAMETERS_RDNA2,
64- MMVQ_PARAMETERS_RDNA3 ,
64+ MMVQ_PARAMETERS_RDNA3_0 ,
6565 MMVQ_PARAMETERS_RDNA4
6666};
6767
6868static constexpr __device__ mmvq_parameter_table_id get_device_table_id () {
6969#if defined(RDNA4)
7070 return MMVQ_PARAMETERS_RDNA4;
71- #elif defined(RDNA3 )
72- return MMVQ_PARAMETERS_RDNA3 ;
73- #elif defined(RDNA2)
71+ #elif defined(RDNA3_0 )
72+ return MMVQ_PARAMETERS_RDNA3_0 ;
73+ #elif defined(RDNA2) || defined(RDNA3_5)
7474 return MMVQ_PARAMETERS_RDNA2;
7575#elif defined(GCN) || defined(CDNA)
7676 return MMVQ_PARAMETERS_GCN;
@@ -83,10 +83,10 @@ static __host__ mmvq_parameter_table_id get_device_table_id(int cc) {
8383 if (GGML_CUDA_CC_IS_RDNA4 (cc)) {
8484 return MMVQ_PARAMETERS_RDNA4;
8585 }
86- if (GGML_CUDA_CC_IS_RDNA3 (cc)) {
87- return MMVQ_PARAMETERS_RDNA3 ;
86+ if (GGML_CUDA_CC_IS_RDNA3_0 (cc)) {
87+ return MMVQ_PARAMETERS_RDNA3_0 ;
8888 }
89- if (GGML_CUDA_CC_IS_RDNA2 (cc)) {
89+ if (GGML_CUDA_CC_IS_RDNA2 (cc) || GGML_CUDA_CC_IS_RDNA3_5 (cc) ) {
9090 return MMVQ_PARAMETERS_RDNA2;
9191 }
9292 if (GGML_CUDA_CC_IS_GCN (cc) || GGML_CUDA_CC_IS_CDNA (cc)) {
@@ -150,7 +150,7 @@ static constexpr __host__ __device__ int calc_nwarps(ggml_type type, int ncols_d
150150 }
151151 return 1 ;
152152 }
153- if (table_id == MMVQ_PARAMETERS_RDNA3 ) {
153+ if (table_id == MMVQ_PARAMETERS_RDNA3_0 ) {
154154 // RDNA3.0 (W7900): stricter whitelist than RDNA4. RDNA3.5 uses the RDNA2 table instead.
155155 // Q2_K / Q5_K / IQ4_XS regress in full quant sweeps.
156156 if (ncols_dst == 1 ) {
0 commit comments