Skip to content

Commit 34f4762

Browse files
committed
1
Signed-off-by: Xiaodong Ye <[email protected]>
1 parent f85dbd2 commit 34f4762

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

ggml/src/ggml-cuda/ggml-cuda.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3030,8 +3030,8 @@ static bool ggml_backend_cuda_device_supports_op(ggml_backend_dev_t dev, const g
3030 3030
const int cc = ggml_cuda_info().devices[dev_ctx->device].cc;
3031 3031
if (GGML_CUDA_CC_IS_MTHREADS(cc) && b->ne[2]*b->ne[3] > 1 &&
3032 3032
!ggml_is_transposed(a) && !ggml_is_transposed(b)) {
3033-
if (GGML_CUDA_CC_IS_QY1(cc) && op->op == GGML_OP_MUL_MAT
3034-
&& b->type == GGML_TYPE_F16) {
3033+
if (GGML_CUDA_CC_IS_QY1(cc) && op->op == GGML_OP_MUL_MAT &&
3034+
a->type == GGML_TYPE_F16 && b->type == GGML_TYPE_F16) {
3035 3035
return false;
3036 3036
}
3037 3037
if (GGML_CUDA_CC_IS_QY2(cc) && op->op == GGML_OP_MUL_MAT_ID &&

0 commit comments

Comments
 (0)