We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent f763866, commit f18ad77 (Copy full SHA for f18ad77)
ggml/src/ggml-cuda/ggml-cuda.cu
@@ -1216,6 +1216,7 @@ static void ggml_cuda_op_mul_mat_cublas(
1216
1217
CUBLAS_CHECK(cublasSetStream(ctx.cublas_handle(id), stream));
1218
1219
+ const int compute_capability = ggml_cuda_info().devices[ctx.device].cc;
1220
if (GGML_CUDA_CC_IS_CDNA(compute_capability) || GGML_CUDA_CC_IS_RDNA4(compute_capability)) {
1221
const float alpha = 1.0f;
1222
const float beta = 0.0f;
0 commit comments