Fix ARM_NEON build failure due to q8_2 (#303)

ikawrakow · Iwan Kawrakow · web-flow · commit 21a5b8bd2820 · 2025-04-01T13:48:20.000+02:00
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
diff --git a/ggml/src/ggml-alloc.c b/ggml/src/ggml-alloc.c
@@ -174,8 +174,8 @@ static size_t ggml_dyn_tallocr_alloc(struct ggml_dyn_tallocr * alloc, size_t siz
             // this should never happen
             fprintf(stderr, "%s: not enough space in the buffer to allocate %zu bytes, largest block available %zu bytes\n",
                     __func__, size, max_avail);
-            fprintf(stderr, "%s: tensor was %s with %zu elements and %zu bytes\n", __func__, tensor->name,
-                    ggml_nelements(tensor), ggml_nbytes(tensor));
+            fprintf(stderr, "%s: tensor was %s with %g elements and %zu bytes\n", __func__, tensor->name,
+                    1.*ggml_nelements(tensor), ggml_nbytes(tensor));
             GGML_ABORT("not enough space in the buffer");
         }
     }
diff --git a/ggml/src/iqk/iqk_quantize.cpp b/ggml/src/iqk/iqk_quantize.cpp
@@ -860,9 +860,9 @@ void quantize_row_q8_1_x4_T(const float * x, Block * y, int64_t k) {
             }
         } else {
             if (i < nb4) {
-                y4[i4].s[ir] = vaddvq_s32(accv);
+                y4[i4].d[ir+4] = GGML_FP32_TO_BF16(d * vaddvq_s32(accv)).bits;
             } else {
-                y[i].s = vaddvq_s32(accv);
+                y[i].s = GGML_FP32_TO_BF16(d * vaddvq_s32(accv)).bits;
             }
         }
     }

Original file line number	Diff line number	Diff line change
`@@ -174,8 +174,8 @@ static size_t ggml_dyn_tallocr_alloc(struct ggml_dyn_tallocr * alloc, size_t siz`
`174`	`174`	`// this should never happen`
`175`	`175`	`fprintf(stderr, "%s: not enough space in the buffer to allocate %zu bytes, largest block available %zu bytes\n",`
`176`	`176`	`__func__, size, max_avail);`
`177`		`- fprintf(stderr, "%s: tensor was %s with %zu elements and %zu bytes\n", __func__, tensor->name,`
`178`		`- ggml_nelements(tensor), ggml_nbytes(tensor));`
	`177`	`+ fprintf(stderr, "%s: tensor was %s with %g elements and %zu bytes\n", __func__, tensor->name,`
	`178`	`+ 1.*ggml_nelements(tensor), ggml_nbytes(tensor));`
`179`	`179`	`GGML_ABORT("not enough space in the buffer");`
`180`	`180`	`}`
`181`	`181`	`}`
Original file line number	Diff line number	Diff line change
`@@ -860,9 +860,9 @@ void quantize_row_q8_1_x4_T(const float * x, Block * y, int64_t k) {`
`860`	`860`	`}`
`861`	`861`	`} else {`
`862`	`862`	`if (i < nb4) {`
`863`		`- y4[i4].s[ir] = vaddvq_s32(accv);`
	`863`	`+ y4[i4].d[ir+4] = GGML_FP32_TO_BF16(d * vaddvq_s32(accv)).bits;`
`864`	`864`	`} else {`
`865`		`- y[i].s = vaddvq_s32(accv);`
	`865`	`+ y[i].s = GGML_FP32_TO_BF16(d * vaddvq_s32(accv)).bits;`
`866`	`866`	`}`
`867`	`867`	`}`
`868`	`868`	`}`