We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c14e3e4 commit 0b45665 Copy full SHA for 0b45665
ggml/src/ggml-cpu/repack.cpp
@@ -1846,8 +1846,11 @@ static const ggml::cpu::tensor_traits * ggml_repack_get_optimal_repack_type(cons
1846
if (cur->ne[1] % 8 == 0) {
1847
return &q4_K_8x8_q8_K;
1848
}
1849
- } else if (ggml_cpu_has_neon() && ggml_cpu_has_matmul_int8()) {
1850
- return &q4_K_8x8_q8_K;
+ }
+ if (ggml_cpu_has_neon() && ggml_cpu_has_matmul_int8() && ggml_cpu_has_dotprod()) {
1851
+ if (cur->ne[1] % 8 == 0) {
1852
+ return &q4_K_8x8_q8_K;
1853
1854
1855
} else if (cur->type == GGML_TYPE_Q2_K) {
1856
if (ggml_cpu_has_avx512()) {
0 commit comments