We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 2625283 · commit e52a0f2 (Copy full SHA for e52a0f2)
ggml/src/ggml-vulkan/ggml-vulkan.cpp
@@ -1404,10 +1404,10 @@ static void ggml_vk_load_shaders(vk_device& device) {
1404
// spec constants and tile sizes for non-quant matmul/matmul_id
1405
l_warptile = { 256, 128, 256, 64 };
1406
m_warptile = { 256, 128, 128, 64 };
1407
- s_warptile = { 128, 32, 16, 64 };
+ s_warptile = { 128, 64, 64, 64 };
1408
l_wg_denoms = {128, 256, 1 };
1409
m_wg_denoms = {128, 128, 1 };
1410
- s_wg_denoms = { 32, 16, 1 };
+ s_wg_denoms = { 64, 64, 1 };
1411
1412
// spec constants and tile sizes for quant matmul (non-Qi_K)
1413
l_warptile_mmq = { 256, 128, 256, 64 };
0 commit comments