Skip to content

Commit a5aa1f3

Browse files
committed
Helper files.
1 parent 1318b76 commit a5aa1f3

18 files changed

+40206
-51
lines changed

ggml/src/ggml-common_ik.h_

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -386,10 +386,11 @@ static_assert(sizeof(block_q6_k_r4) == 4*sizeof(ggml_half) + QK_K/4 + 3*QK_K, "w
386386
// This is only used for intermediate quantization and dot products
387387
typedef struct {
388388
float d; // delta (a single float stored per block)
389+
float sum; // sum of quants in the entire block (field added by this commit)
389390
int8_t qs[QK_K]; // quants: QK_K signed 8-bit values per block
390391
int16_t bsums[QK_K/16]; // sum of quants in groups of 16, i.e. QK_K/16 partial sums per block
391392
} block_q8_K;
392-
static_assert(sizeof(block_q8_K) == sizeof(float) + QK_K + QK_K/16*sizeof(int16_t), "wrong q8_K block size/padding"); // removed form: matched the layout with one float (d) only
393+
static_assert(sizeof(block_q8_K) == 2*sizeof(float) + QK_K + QK_K/16*sizeof(int16_t), "wrong q8_K block size/padding"); // added form: two floats (d, sum) + qs + bsums; compilation fails if the struct size differs, e.g. due to padding
393394
typedef struct {
394395
float d; // delta
395396
int8_t qs[64]; // quants

0 commit comments

Comments
 (0)