Skip to content

Commit bc00169

Browse files
authored
Merge branch 'ikawrakow:main' into main
2 parents 0e9059d + 0ba5424 commit bc00169

File tree

1 file changed: +2 -2 lines changed

1 file changed

+2
-2
lines changed

ggml/src/ggml-cuda/cpy.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -336,7 +336,7 @@ static void ggml_cpy_f32_q6_0_cuda(
336336
const int nb03, const int ne10, const int ne11, const int ne12, const int nb10, const int nb11, const int nb12, const int nb13, cudaStream_t stream, char ** cdst_indirect, int & graph_cpynode_index) {
337337

338338
GGML_ASSERT(ne % QK6_0 == 0);
339-
const int num_blocks = ne / QK5_1;
339+
const int num_blocks = ne / QK6_0;
340340
cpy_f32_q<cpy_blck_f32_q6_0, QK6_0><<<num_blocks, 1, 0, stream>>>
341341
(cx, cdst, ne, ne00, ne01, ne02, nb00, nb01, nb02, nb03, ne10, ne11, ne12, nb10, nb11, nb12, nb13, cdst_indirect, graph_cpynode_index++);
342342
}
@@ -590,7 +590,7 @@ void* ggml_cuda_cpy_fn(const ggml_tensor * src0, ggml_tensor * src1) {
590590
} else if (src0->type == GGML_TYPE_F32 && src1->type == GGML_TYPE_Q6_0) {
591591
return (void*) cpy_f32_q<cpy_blck_f32_q6_0, QK6_0>;
592592
} else if (src0->type == GGML_TYPE_Q6_0 && src1->type == GGML_TYPE_F32) {
593-
return (void*) cpy_q_f32<cpy_blck_q_f32<dequantize_q6_0, QK6_0>, QK5_1>;
593+
return (void*) cpy_q_f32<cpy_blck_q_f32<dequantize_q6_0, QK6_0>, QK6_0>;
594594
} else if (src0->type == GGML_TYPE_F16 && src1->type == GGML_TYPE_F16) {
595595
return (void*) cpy_flt<cpy_1_flt<half, half>>;
596596
} else if (src0->type == GGML_TYPE_F16 && src1->type == GGML_TYPE_BF16) {

0 commit comments

Comments
 (0)