We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0b1fec6, commit c14e3e4 (Copy full SHA for c14e3e4)
ggml/src/ggml-cpu/arch/arm/repack.cpp
@@ -2260,7 +2260,6 @@ void ggml_gemm_q4_K_8x8_q8_K(int n,
2260
2261
for (int i = 0; i < q8_k_blocklen; i++) {
2262
for (int j = 0; j < 2; j++) {
2263
- // TODO: Change to a single vmul
2264
float32x4_t q8_d = vdupq_n_f32(q8_ptr[b].d[i]);
2265
float32x4_t q4_dmin = vcvt_f32_f16(vld1_f16((const __fp16 *)(q4_ptr[b].dmin + j * 4)));
2266
const float32x4_t dmins = vmulq_f32(q4_dmin, q8_d);
0 commit comments