7676#define  GGML_CUDA_CC_IS_CDNA (cc )  (cc >= GGML_CUDA_CC_CDNA && cc < GGML_CUDA_CC_RDNA1)
7777
7878//  Moore Threads
79- #define  GGML_CUDA_MUSA_ARCH_IS_QY1  (__MUSA_ARCH__ <= 210 )
80- 
8179#define  GGML_CUDA_CC_QY1   (GGML_CUDA_CC_OFFSET_MTHREADS + 0x210 ) //  MTT S80, MTT S3000
8280#define  GGML_CUDA_CC_QY2   (GGML_CUDA_CC_OFFSET_MTHREADS + 0x220 ) //  MTT S4000
8381#define  GGML_CUDA_CC_NG    (GGML_CUDA_CC_OFFSET_MTHREADS + 0x310 ) //  TBD
@@ -215,9 +213,9 @@ typedef float2 dfloat2;
215213#define  FP16_MMA_AVAILABLE 
216214#endif  //  defined(GGML_HIP_ROCWMMA_FATTN) && (defined(CDNA) || defined(RDNA3) || defined(RDNA4))
217215
218- #if  defined(GGML_USE_MUSA) && !GGML_CUDA_MUSA_ARCH_IS_QY1 
216+ #if  defined(GGML_USE_MUSA) && __MUSA_ARCH__ >= 220 
219217#define  FP16_MMA_AVAILABLE 
220- #endif  //  defined(GGML_USE_MUSA) && !GGML_CUDA_MUSA_ARCH_IS_QY1 
218+ #endif  //  defined(GGML_USE_MUSA) && __MUSA_ARCH__ >= 220 
221219
222220#if  !(defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)) && __CUDA_ARCH__ >= GGML_CUDA_CC_TURING
223221#define  NEW_MMA_AVAILABLE 
@@ -227,9 +225,9 @@ typedef float2 dfloat2;
227225#define  CP_ASYNC_AVAILABLE 
228226#endif  //  !(defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)) && __CUDA_ARCH__ >= GGML_CUDA_CC_AMPERE
229227
230- #if  !defined(GGML_CUDA_NO_FA) && !(defined(GGML_USE_MUSA) && GGML_CUDA_MUSA_ARCH_IS_QY1 )
228+ #if  !defined(GGML_CUDA_NO_FA) && !(defined(GGML_USE_MUSA) && __MUSA_ARCH__ < 220 )
231229#define  FLASH_ATTN_AVAILABLE 
232- #endif  //  !defined(GGML_CUDA_NO_FA) && !(defined(GGML_USE_MUSA) && GGML_CUDA_MUSA_ARCH_IS_QY1 )
230+ #endif  //  !defined(GGML_CUDA_NO_FA) && !(defined(GGML_USE_MUSA) && __MUSA_ARCH__ < 220 )
233231
234232static  bool  fp16_available (const  int  cc) {
235233    return  ggml_cuda_highest_compiled_arch (cc) >= GGML_CUDA_CC_PASCAL;
0 commit comments