Skip to content

Commit 1cc5037

Browse files
author
Huaishun Hu
committed
fixme: MUSA compute capability (cc) had to fall back to the generic CUDA path to fix inference
1 parent e3c0041 commit 1cc5037

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

ggml/src/ggml-cuda/ggml-cuda.cu

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -179,11 +179,11 @@ static ggml_cuda_device_info ggml_cuda_init() {
179 179   #if defined(GGML_USE_HIP) && defined(__HIP_PLATFORM_AMD__)
180 180   info.devices[id].smpbo = prop.sharedMemPerBlock;
181 181   info.devices[id].cc = 100*prop.major + 10*prop.minor + GGML_CUDA_CC_OFFSET_AMD;
182     - #elif defined(GGML_USE_MUSA)
183     - /** TODO: MUSA arch should match CUDA 11.4 */
184     - info.devices[id].smpbo = prop.sharedMemPerBlockOptin;
185     - // info.devices[id].cc = 100*prop.major + 10*prop.minor + CC_OFFSET_MT;
186     - info.devices[id].cc = __MUSA_CC__;
    182 + // #elif defined(GGML_USE_MUSA)
    183 + // /** TODO: MUSA arch should match CUDA 11.4 */
    184 + // info.devices[id].smpbo = prop.sharedMemPerBlockOptin;
    185 + // // info.devices[id].cc = 100*prop.major + 10*prop.minor + CC_OFFSET_MT;
    186 + // info.devices[id].cc = __MUSA_CC__;
187 187   #else
188 188   info.devices[id].smpbo = prop.sharedMemPerBlockOptin;
189 189   info.devices[id].cc = 100*prop.major + 10*prop.minor;

0 commit comments

Comments
 (0)