Skip to content

Commit 057e67c

Browse files
committed
opencl: use q8_0 mm for larger matrix
1 parent 5aa2835 commit 057e67c

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

ggml/src/ggml-opencl/ggml-opencl.cpp

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -6980,6 +6980,9 @@ static void ggml_cl_mul_mat(ggml_backend_t backend, const ggml_tensor * src0, co
6980 6980
return;
6981 6981
}
6982 6982
case GGML_TYPE_Q8_0: {
6983+
if (ne11 < 32) {
6984+
break;
6985+
}
6983 6986
kernel = backend_ctx->kernel_mul_mm_q8_0_f32_l4_lm;
6984 6987
nth0 = 128; // calculated as (BM*BN)/(TM*TN)
6985 6988

0 commit comments

Comments
 (0)