Skip to content

Commit 940817b

Browse files
committed
tune matmul for gcn
1 parent 2f74c35 commit 940817b

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

ggml/src/ggml-vulkan/ggml-vulkan.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1740,6 +1740,10 @@ static void ggml_vk_load_shaders(vk_device& device) {
1740 1740
m_warptile_mmq_int = { 128, 64, 64, 32, subgroup_size_8, 32, 2, 2, 2, 1, subgroup_size_8 };
1741 1741
s_warptile_mmq_int = { subgroup_size_32, 32, 32, 32, 32, 32, 2, 2, 1, 1, subgroup_size_8 };
1742 1742

1743+
// chip specific tuning
1744+
if (device->architecture == AMD_GCN)
1745+
m_warptile_mmq = { 256, 64, 64, 32, subgroup_size_8, 16, 2, 2, tn_m, tk_m, subgroup_size_8 };
1746+
1743 1747
l_mmq_wg_denoms = l_wg_denoms = {128, 128, 1 };
1744 1748
m_mmq_wg_denoms = m_wg_denoms = { 64, 64, 1 };
1745 1749
s_mmq_wg_denoms = s_wg_denoms = { 32, 32, 1 };

0 commit comments

Comments
 (0)