Skip to content

Commit c7c4d65

Browse files
committed
Speed up KV in llamafile-bench
1 parent d2be732 commit c7c4d65

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

llama.cpp/llama-bench/llama-bench.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -265,8 +265,8 @@ static const cmd_params cmd_params_defaults = {
265 265      /* n_pg */ {},
266 266      /* n_batch */ {2048},
267 267      /* n_ubatch */ {512},
268     -    /* type_k */ {GGML_TYPE_F16},
269     -    /* type_v */ {GGML_TYPE_F16},
    268 +    /* type_k */ {X86_HAVE(AVX512_BF16) ? GGML_TYPE_BF16 : GGML_TYPE_F16},
    269 +    /* type_v */ {X86_HAVE(AVX512_BF16) ? GGML_TYPE_BF16 : GGML_TYPE_F16},
270 270      /* n_threads */ {cpu_get_num_math()},
271 271      /* n_gpu_layers */ {0},
272 272      /* split_mode */ {LLAMA_SPLIT_MODE_LAYER},

0 commit comments

Comments
 (0)