Skip to content

Commit a3aea08

Browse files
authored
rm_kq=2 by default
1 parent fa70739 commit a3aea08

File tree

1 file changed

+3
-6
lines changed

1 file changed

+3
-6
lines changed

ggml/src/ggml-vulkan/ggml-vulkan.cpp

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1857,17 +1857,14 @@ static void ggml_vk_load_shaders(vk_device& device) {
1857 1857
1858 1858      // the number of rows computed per shader depends on GPU model and quant
1859 1859      uint32_t rm_stdq = 1;
1860      -    uint32_t rm_kq = 1;
     1860 +    uint32_t rm_kq = 2;
1861 1861      if (device->vendor_id == VK_VENDOR_ID_AMD) {
1862 1862          if (device->subgroup_min_size == 64 && device->subgroup_max_size == 64) { // GCN
1863 1863              rm_stdq = 2;
1864 1864              rm_kq = 4;
1865      -        } else // RDNA
1866      -            rm_kq = 2;
1867      -    } else if (device->vendor_id == VK_VENDOR_ID_INTEL) {
     1865 +        }
     1866 +    } else if (device->vendor_id == VK_VENDOR_ID_INTEL)
1868 1867          rm_stdq = 2;
1869      -        rm_kq = 2;
1870      -    }
1871 1868
1872 1869      ggml_vk_create_pipeline(device, device->pipeline_dequant_mul_mat_vec_f32_f32[GGML_TYPE_F32 ], "mul_mat_vec_f32_f32_f32", mul_mat_vec_f32_f32_f32_len, mul_mat_vec_f32_f32_f32_data, "main", 3, sizeof(vk_mat_vec_push_constants), {2, 1, 1}, {device->subgroup_size, 2}, 1);
1873 1870      ggml_vk_create_pipeline(device, device->pipeline_dequant_mul_mat_vec_f32_f32[GGML_TYPE_F16 ], "mul_mat_vec_f16_f32_f32", mul_mat_vec_f16_f32_f32_len, mul_mat_vec_f16_f32_f32_data, "main", 3, sizeof(vk_mat_vec_push_constants), {2, 1, 1}, {device->subgroup_size, 2}, 1);

0 commit comments

Comments (0)