Skip to content

Commit cc091f8

Browse files
netrunnereve and 0cc4m authored
Update ggml/src/ggml-vulkan/ggml-vulkan.cpp
Co-authored-by: 0cc4m <[email protected]>
1 parent 54b0053 commit cc091f8

File tree

1 file changed

+3 -2 lines changed

1 file changed

+3
-2
lines changed

ggml/src/ggml-vulkan/ggml-vulkan.cpp

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1741,8 +1741,9 @@ static void ggml_vk_load_shaders(vk_device& device) {
         s_warptile_mmq_int = { subgroup_size_32, 32, 32, 32, 32, 32, 2, 2, 1, 1, subgroup_size_8 };
 
         // chip specific tuning
-        if (device->architecture == AMD_GCN)
-            m_warptile_mmq = { 256, 64, 64, 32, 16, 16, 2, 2, tn_m, tk_m, 16 };
+        if (device->architecture == AMD_GCN) {
+            m_warptile_mmq = m_warptile_mmq_int = { 256, 64, 64, 32, 16, 16, 2, 2, 2, 1, 16 };
+        }
 
         l_mmq_wg_denoms = l_wg_denoms = {128, 128, 1 };
         m_mmq_wg_denoms = m_wg_denoms = { 64, 64, 1 };

0 commit comments

Comments
 (0)