We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 86d33ac, commit 6afb592 (Copy full SHA for 6afb592)
ggml/src/ggml-cuda/common.cuh
@@ -183,6 +183,8 @@ static constexpr bool new_mma_available(const int cc) {
183
static constexpr __device__ int ggml_cuda_get_physical_warp_size() {
184
#if defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)
185
return __AMDGCN_WAVEFRONT_SIZE;
186
+#elif defined(GGML_USE_MUSA)
187
+ return 128;
188
#else
189
return 32;
190
#endif // defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)
0 commit comments