Skip to content

Commit cfa4fc1

Browse files
committed
Select the f32 get_rows no_vec pipeline when dst->ne[0] % 4 != 0 (previously only when dst->ne[0] < 4)
1 parent 26742e2 commit cfa4fc1

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ggml/src/ggml-webgpu/ggml-webgpu.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -597,7 +597,7 @@ static void ggml_webgpu_get_rows(webgpu_context & ctx, ggml_tensor * src, ggml_t
597 597       uint32_t wg_x = (dst->ne[1] * dst->ne[2] * dst->ne[3] + max_wg_size - 1) / max_wg_size;
598 598
599 599       wgpu::ComputePipeline pipeline = ctx->get_rows_pipeline[src->type];
600     -     if (src->type == GGML_TYPE_F32 && dst->ne[0] < 4) {
    600 +     if (src->type == GGML_TYPE_F32 && dst->ne[0] % 4 != 0) {
601 601           pipeline = ctx->get_rows_f32_no_vec_pipeline;
602 602       }
603 603       ggml_backend_webgpu_build_and_enqueue(ctx, pipeline, params, entries, wg_x, ggml_op_name(dst->op));

0 commit comments

Comments
 (0)