File tree Expand file tree Collapse file tree 2 files changed +0
-36
lines changed Expand file tree Collapse file tree 2 files changed +0
-36
lines changed Original file line number Diff line number Diff line change @@ -263,9 +263,7 @@ static ggml_cuda_device_info ggml_cuda_init() {
263263 device_vmm ? " yes" : " no" , prop.warpSize );
264264#elif defined(GGML_USE_MUSA)
265265 info.devices [id].smpbo = prop.sharedMemPerBlockOptin ;
266- /* * FIXME: MUSA arch should match CUDA 11.4 */
267266 info.devices [id].cc = 100 *prop.major + 10 *prop.minor ;
268- // info.devices[id].cc = __MUSA_CC__;
269267#else
270268 info.devices [id].smpbo = prop.sharedMemPerBlockOptin ;
271269 info.devices [id].cc = 100 *prop.major + 10 *prop.minor ;
Original file line number Diff line number Diff line change 135135#define cudaStreamEndCapture musaStreamEndCapture
136136
137137typedef mt_bfloat16 nv_bfloat16 ;
138-
139- /** FIXME: MUSA arch should match CUDA 11.4 */
140- // #define GGML_CUDA_CC_PASCAL 600
141- // #define GGML_CUDA_CC_DP4A 610
142- // #define GGML_CUDA_CC_VOLTA 700
143- // #define GGML_CUDA_CC_TURING 750
144- // #define GGML_CUDA_CC_AMPERE 800
145-
146- #define __MUSA_CC__ 610
147- // #define __CUDA_ARCH__ __MUSA_CC__
148-
149-
150- /** TODO: following apis not supported yet by musa sdk: ***********/
151-
152- // __device__ __half hexp(const __half a) {
153- // float f_a = __half2float(a);
154- // float f_result = expf(f_a);
155- // return __float2half(f_result);
156- // }
157-
158- // __host__ __device__ __half2 h2exp(const __half2 a) {
159- // // Extract lower and upper halves
160- // __half lower = __low2half(a);
161- // __half upper = __high2half(a);
162-
163- // // Compute exp for each half
164- // __half exp_lower = hexp(lower);
165- // __half exp_upper = hexp(upper);
166-
167- // // Combine back into __half2
168- // return __halves2half2(exp_lower, exp_upper);
169- // }
170-
171- /******************************************************************/
You can’t perform that action at this time.
0 commit comments