Skip to content

Commit 44b1efa

Browse files
authored
tests: add performance test for mul mat id (ggml-org#15543)
1 parent a6a58d6 commit 44b1efa

File tree

1 file changed

+18
-0
lines changed

1 file changed

+18
-0
lines changed

tests/test-backend-ops.cpp

Lines changed: 18 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -6400,6 +6400,24 @@ static std::vector<std::unique_ptr<test_case>> make_test_cases_perf() {
64006400
}
64016401
}
64026402

6403+
// qwen3-30b-a3b
6404+
for (int bs : {1, 4, 8, 512}) {
6405+
for (ggml_type type_a : {GGML_TYPE_F32, GGML_TYPE_F16, GGML_TYPE_Q4_0, GGML_TYPE_Q8_0, GGML_TYPE_Q4_K, GGML_TYPE_Q6_K, GGML_TYPE_IQ2_XS}) {
6406+
for (ggml_type type_b : {GGML_TYPE_F32}) {
6407+
test_cases.emplace_back(new test_mul_mat_id(type_a, type_b, 128, 8, false, 768, bs, 2048, 1));
6408+
}
6409+
}
6410+
}
6411+
6412+
// gpt-oss-20b
6413+
for (int bs : {1, 4, 8, 512}) {
6414+
for (ggml_type type_a : {GGML_TYPE_MXFP4}) {
6415+
for (ggml_type type_b : {GGML_TYPE_F32}) {
6416+
test_cases.emplace_back(new test_mul_mat_id(type_a, type_b, 32, 4, false, 2880, bs, 2880, 1));
6417+
}
6418+
}
6419+
}
6420+
64036421
for (int K : {3, 5}) {
64046422
for (int IC : {256, 2560}) {
64056423
for (int IW_IH : {32, 64, 256}) {

0 commit comments

Comments (0)