We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 901e9d8, commit 12df4a7 (Copy full SHA for 12df4a7)
scripts/compare-llama-bench.py
@@ -27,6 +27,7 @@
27
"model_type", "model_size", "model_n_params", "n_batch", "n_ubatch", "n_threads",
28
"cpu_mask", "cpu_strict", "poll", "type_k", "type_v", "n_gpu_layers",
29
"split_mode", "main_gpu", "no_kv_offload", "flash_attn", "tensor_split", "tensor_buft_overrides",
30
+ "defrag_thold",
31
"use_mmap", "embeddings", "no_op_offload", "n_prompt", "n_gen", "n_depth",
32
"test_time", "avg_ns", "stddev_ns", "avg_ts", "stddev_ts",
33
]
0 commit comments