@@ -30,8 +30,10 @@ options:
3030 --delay <0...N> (seconds) delay between each test (default: 0)
3131 -o, --output <csv|json|jsonl|md|sql> output format printed to stdout (default: md)
3232 -oe, --output-err <csv|json|jsonl|md|sql> output format printed to stderr (default: none)
33+ --list-devices list available devices and exit
3334 -v, --verbose verbose output
3435 --progress print test progress indicators
36+ -rpc, --rpc <rpc_servers> register RPC devices (comma separated)
3537
3638test parameters:
3739 -m, --model <filename> (default: models/7B/ggml-model-q4_0.gguf)
@@ -48,11 +50,12 @@ test parameters:
4850 --cpu-strict <0|1> (default: 0)
4951 --poll <0...100> (default: 50)
5052 -ngl, --n-gpu-layers <n> (default: 99)
51- -rpc, --rpc <rpc_servers> (default: none)
53+ -ncmoe, --n-cpu-moe <n> (default: 0)
5254 -sm, --split-mode <none|layer|row> (default: layer)
5355 -mg, --main-gpu <i> (default: 0)
5456 -nkvo, --no-kv-offload <0|1> (default: 0)
5557 -fa, --flash-attn <0|1> (default: 0)
58+ -dev, --device <dev0/dev1/...> (default: auto)
5659 -mmp, --mmap <0|1> (default: 1)
5760 -embd, --embeddings <0|1> (default: 0)
5861 -ts, --tensor-split <ts0/ts1/..> (default: 0)
0 commit comments