Skip to content

Commit 955706b

Browse files
author
zhouwg
committed
ggml-hexagon: try to offload q6_k mulmat to cDSP
1 parent 056aa4c commit 955706b

File tree

3 files changed

+1047 additions, -289 deletions

ggml/src/ggml-hexagon/ggml-hexagon.cpp

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -5028,7 +5028,7 @@ static bool ggmlhexagon_can_handle_op_through_cdsp(ggml_backend_dev_t dev, const
5028 5028
//FIXME:remove this filter
5029 5029
if (ne00 < 32)
5030 5030
return false;
5031-
5031+
5032 5032
//FIXME:remove this filter
5033 5033
return ggmlhexagon_same_types(ctx, op_tensor);
5034 5034
}
@@ -5042,8 +5042,8 @@ static bool ggmlhexagon_can_handle_op_through_cdsp(ggml_backend_dev_t dev, const
5042 5042

5043 5043
ggmlhexagon_dump_op_info(op_tensor);
5044 5044
if (g_hexagon_appcfg.enable_q_mulmat)
5045-
return (src0->type == GGML_TYPE_F32 || ggml_is_quantized(src0->type))
5046-
&& (src1->type == GGML_TYPE_F32) && (op_tensor->type == GGML_TYPE_F32);
5045+
return (src0->type == GGML_TYPE_F32 || src0->type == GGML_TYPE_Q6_K
5046+
) && (src1->type == GGML_TYPE_F32) && (op_tensor->type == GGML_TYPE_F32);
5047 5047
else
5048 5048
return (src0->type == GGML_TYPE_F32) && (src1->type == GGML_TYPE_F32) && (op_tensor->type == GGML_TYPE_F32);
5049 5049
}

0 commit comments

Comments
 (0)