We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ef01952 commit c4f1358 (Copy full SHA for c4f1358)
ggml/src/ggml-cpu/arch/arm/repack.cpp
@@ -2086,8 +2086,6 @@ void ggml_gemm_q4_K_8x8_q8_K(int n,
2086
2087
constexpr int ncols_interleaved = 8;
2088
constexpr int blocklen = 8;
2089
- constexpr int q8_k_blocklen = 4;
2090
-
2091
2092
assert(n % qk == 0);
2093
assert(nr % 4 == 0);
@@ -2104,6 +2102,7 @@ void ggml_gemm_q4_K_8x8_q8_K(int n,
2104
2102
UNUSED(blocklen);
2105
2103
2106
#if ! ((defined(_MSC_VER)) && ! defined(__clang__)) && defined(__aarch64__) && defined(__ARM_NEON) && defined(__ARM_FEATURE_MATMUL_INT8)
+ constexpr int q8_k_blocklen = 4;
2107
const uint8x16_t m4b = vdupq_n_u8(0x0f);
2108
2109
// 8 accumulators: 2 row pairs × 4 col pairs
0 commit comments