We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5d09cb2, commit 1191c82 (Copy full SHA for 1191c82)
ggml/src/ggml-metal/ggml-metal.m
@@ -1194,7 +1194,7 @@ static bool ggml_metal_supports_op(const struct ggml_backend_metal_device_contex
1194
case GGML_OP_SUM_ROWS:
1195
case GGML_OP_SOFT_MAX:
1196
case GGML_OP_GROUP_NORM:
1197
- return has_simdgroup_reduction;
+ return has_simdgroup_reduction && (op->ne[0] % 4 == 0 && ggml_is_contiguous_1(op->src[0]));
1198
case GGML_OP_RMS_NORM:
1199
return has_simdgroup_reduction && (op->ne[0] % 4 == 0);
1200
case GGML_OP_ARGMAX:
0 commit comments