Skip to content

Commit 69b7db8

Browse files
committed
vulkan: fix noncontig check for mat_mul_id splitting
Remove supports_op check for > 4096 (splitting fixes this)
1 parent bdca383 commit 69b7db8

File tree

1 file changed: +1 -5 lines changed

ggml/src/ggml-vulkan/ggml-vulkan.cpp

Lines changed: 1 addition & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -4916,7 +4916,7 @@ static bool ggml_vk_dim01_contiguous(const ggml_tensor * tensor) {
4916 4916       return
4917 4917           tensor->nb[0] == ggml_type_size(tensor->type) &&
4918 4918           tensor->nb[1] == (tensor->nb[0]*tensor->ne[0])/ggml_blck_size(tensor->type) &&
4919      -         tensor->nb[3] == tensor->nb[2]*tensor->ne[2];
     4919 +         (tensor->ne[3] == 1 || tensor->nb[3] == tensor->nb[2]*tensor->ne[2]);
4920 4920   }
4921 4921
4922 4922   static vk_pipeline ggml_vk_get_cpy_pipeline(ggml_backend_vk_context * ctx, const ggml_tensor * src, const ggml_tensor * dst, ggml_type to) {
@@ -10350,10 +10350,6 @@ static bool ggml_backend_vk_device_supports_op(ggml_backend_dev_t dev, const ggm
10350 10350           // If there's not enough shared memory for row_ids and the result tile, fallback to CPU
10351 10351           return false;
10352 10352       }
10353       -     // Check against size of shared memory variable
10354       -     if (op->src[2]->ne[0] > 4096) {
10355       -         return false;
10356       -     }
10357 10353   }
10358 10354   switch (src0_type) {
10359 10355       case GGML_TYPE_F32:

0 commit comments

Comments
 (0)