Skip to content

Commit 3978014

Browse files
matmul-int8: fixed typos in q8_0_q8_0 matmuls
Co-authored-by: Georgi Gerganov <[email protected]>
1 parent e838a3d commit 3978014

File tree

1 file changed

+4 / -4 lines changed (4 additions, 4 deletions)

1 file changed

+4
-4
lines changed

ggml-quants.c

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -4838,18 +4838,18 @@ void ggml_vec_dot_q8_0_q8_0(int n, float * restrict s, size_t bs, const void * r
48384838

48394839
#if defined(__ARM_FEATURE_MATMUL_INT8)
48404840
if (nrc == 2) {
4841-
const block_q4_0 * restrict vx0 = vx;
4842-
const block_q4_0 * restrict vx1 = (const block_q4_0 *) ((const uint8_t*)vx + bx);
4841+
const block_q8_0 * restrict vx0 = vx;
4842+
const block_q8_0 * restrict vx1 = (const block_q8_0 *) ((const uint8_t*)vx + bx);
48434843
const block_q8_0 * restrict vy0 = vy;
48444844
const block_q8_0 * restrict vy1 = (const block_q8_0 *) ((const uint8_t*)vy + by);
48454845

48464846
float32x4_t sumv0 = vdupq_n_f32(0.0f);
48474847

48484848
for (int i = 0; i < nb; i++) {
4849-
const block_q4_0 * restrict b_x0 = &vx0[i];
4849+
const block_q8_0 * restrict b_x0 = &vx0[i];
48504850
const block_q8_0 * restrict b_y0 = &vy0[i];
48514851

4852-
const block_q4_0 * restrict b_x1 = &vx1[i];
4852+
const block_q8_0 * restrict b_x1 = &vx1[i];
48534853
const block_q8_0 * restrict b_y1 = &vy1[i];
48544854

48554855
const int8x16_t x0_l = vld1q_s8((const int8_t*)b_x0->qs);

0 commit comments

Comments (0)