Skip to content

Commit c92b0cf

Browse files
committed
early merge ggml-org#12767 to test
1 parent 65cd25d commit c92b0cf

File tree

1 file changed

+4
-14
lines changed

1 file changed

+4
-14
lines changed

ggml/src/ggml-vulkan/ggml-vulkan.cpp

Lines changed: 4 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -1745,19 +1745,9 @@ static void ggml_vk_load_shaders(vk_device& device) {
1745 1745
m_warptile_mmq = { 128, 64, 64, 32, subgroup_size_8, 32, 2, tm_m, tn_m, tk_m, subgroup_size_8 };
1746 1746
s_warptile_mmq = { subgroup_size_32, 32, 32, 32, 32, 32, 2, tm_s, tn_s, tk_s, subgroup_size_8 };
1747 1747

1748-
const uint32_t tm_int_l = device->coopmat_int_support ? device->coopmat_int_m : 4;
1749-
const uint32_t tm_int_m = device->coopmat_int_support ? device->coopmat_int_m : 4;
1750-
const uint32_t tm_int_s = device->coopmat_int_support ? device->coopmat_int_m : 2;
1751-
const uint32_t tn_int_l = device->coopmat_int_support ? device->coopmat_int_n : 4;
1752-
const uint32_t tn_int_m = device->coopmat_int_support ? device->coopmat_int_n : 2;
1753-
const uint32_t tn_int_s = device->coopmat_int_support ? device->coopmat_int_n : 2;
1754-
const uint32_t tk_int_l = device->coopmat_int_support ? device->coopmat_int_k : 1;
1755-
const uint32_t tk_int_m = device->coopmat_int_support ? device->coopmat_int_k : 1;
1756-
const uint32_t tk_int_s = device->coopmat_int_support ? device->coopmat_int_k : 1;
1757-
1758-
l_warptile_mmq_int = { 128, 128, 128, 32, subgroup_size_8 * 2, 64, 2, tm_int_l, tn_int_l, tk_int_l, subgroup_size_8 };
1759-
m_warptile_mmq_int = { 128, 64, 64, 32, subgroup_size_8, 32, 2, tm_int_m, tn_int_m, tk_int_m, subgroup_size_8 };
1760-
s_warptile_mmq_int = { subgroup_size_32, 32, 32, 32, 32, 32, 2, tm_int_s, tn_int_s, tk_int_s, subgroup_size_8 };
1748+
l_warptile_mmq_int = { 128, 128, 128, 32, subgroup_size_8 * 2, 64, 2, 4, 4, 1, subgroup_size_8 };
1749+
m_warptile_mmq_int = { 128, 64, 64, 32, subgroup_size_8, 32, 2, 2, 2, 1, subgroup_size_8 };
1750+
s_warptile_mmq_int = { subgroup_size_32, 32, 32, 32, 32, 32, 2, 2, 1, 1, subgroup_size_8 };
1761 1751

1762 1752
l_mmq_wg_denoms = l_wg_denoms = {128, 128, 1 };
1763 1753
m_mmq_wg_denoms = m_wg_denoms = { 64, 64, 1 };
@@ -7939,7 +7929,7 @@ static void ggml_vk_preallocate_buffers(ggml_backend_vk_context * ctx) {
7939 7929
128, 49, 49,
7940 7930
4096, 49, 4096,
7941 7931
};
7942-
const size_t num_it = 1;
7932+
const size_t num_it = 100;
7943 7933

7944 7934
ggml_vk_test_dequant_matmul(ctx, 4096, 512, 4096, 2, num_it, 1, 0, GGML_TYPE_Q4_0);
7945 7935
ggml_vk_test_dequant_matmul(ctx, 4096, 512, 4096, 2, num_it, 1, 1, GGML_TYPE_Q4_0);

0 commit comments

Comments (0)